Gagan Bhatia committed on
Commit
1528dbf
1 Parent(s): 1b154c5

Update process_data.py

Browse files
Files changed (1) hide show
  1. src/data/process_data.py +1 -0
src/data/process_data.py CHANGED
@@ -3,6 +3,7 @@ import pandas as pd
3
 
4
  def process_data(split='train'):
5
 
 
6
  df.columns = ['Unnamed: 0', 'input_text', 'output_text']
7
  print(df.columns)
8
  df.to_csv('C:/Users/gbhat/Documents/GitHub/summarization/data/processed/{}.csv'.format(split))
 
3
 
4
  def process_data(split='train'):
5
 
6
+ df = pd.read_csv('data/raw/{}.csv'.format(split))
7
  df.columns = ['Unnamed: 0', 'input_text', 'output_text']
8
  print(df.columns)
9
  df.to_csv('C:/Users/gbhat/Documents/GitHub/summarization/data/processed/{}.csv'.format(split))