Gagan Bhatia committed on
Commit
0130907
1 Parent(s): cc08aa0

Update make_dataset.py

Browse files
Files changed (1) hide show
  1. src/data/make_dataset.py +1 -0
src/data/make_dataset.py CHANGED
@@ -9,6 +9,7 @@ import pprint
9
  def make_dataset(dataset='cnn_dailymail', split='train'):
10
  """make dataset for summarisation"""
11
  if not os.path.exists('data/raw'):
 
12
  dataset = load_dataset(dataset, '3.0.0', split=split)
13
  df = pd.DataFrame()
14
  df['article'] = dataset['article']
 
9
  def make_dataset(dataset='cnn_dailymail', split='train'):
10
  """make dataset for summarisation"""
11
  if not os.path.exists('data/raw'):
12
+ os.makedirs('data/raw')
13
  dataset = load_dataset(dataset, '3.0.0', split=split)
14
  df = pd.DataFrame()
15
  df['article'] = dataset['article']