Gagan Bhatia committed on
Commit
fbbe319
1 Parent(s): 6570db2

Update process_data.py

Browse files
Files changed (1) hide show
  1. src/data/process_data.py +1 -0
src/data/process_data.py CHANGED
@@ -9,6 +9,7 @@ def process_data(split="train"):
9
  params = yaml.safe_load(f)
10
 
11
  df = pd.read_csv("data/raw/{}.csv".format(split))
 
12
  if os.path.exists("data/raw/{}.csv".format(split)):
13
  os.remove("data/raw/{}.csv".format(split))
14
  df.to_csv('data/processed/{}.csv'.format(split))
 
9
  params = yaml.safe_load(f)
10
 
11
  df = pd.read_csv("data/raw/{}.csv".format(split))
12
+ df.columns = ["Unnamed: 0", "input_text", "output_text"]
13
  if os.path.exists("data/raw/{}.csv".format(split)):
14
  os.remove("data/raw/{}.csv".format(split))
15
  df.to_csv('data/processed/{}.csv'.format(split))