Gagan Bhatia committed on
Commit
370f001
1 Parent(s): 06d3c94

Update make_dataset.py

Browse files
Files changed (1) hide show
  1. src/data/make_dataset.py +1 -0
src/data/make_dataset.py CHANGED
@@ -8,6 +8,7 @@ def make_dataset(dataset='cnn_dailymail', split='train'):
8
  df = pd.DataFrame()
9
  df['article'] = dataset['article']
10
  df['highlights'] = dataset['highlights']
 
11
 
12
  if __name__ == '__main__':
13
  make_dataset(dataset='cnn_dailymail', split='train', version="3.0.0")
 
8
  df = pd.DataFrame()
9
  df['article'] = dataset['article']
10
  df['highlights'] = dataset['highlights']
11
+ df.to_csv('C:/Users/gbhat/Documents/GitHub/summarization/data/raw/{}.csv'.format(split))
12
 
13
  if __name__ == '__main__':
14
  make_dataset(dataset='cnn_dailymail', split='train', version="3.0.0")