Gagan Bhatia committed on
Commit
9d3af5f
1 Parent(s): 37328df

Update make_dataset.py

Browse files
Files changed (1) hide show
  1. src/data/make_dataset.py +1 -0
src/data/make_dataset.py CHANGED
@@ -9,6 +9,7 @@ def make_dataset(dataset="cnn_dailymail", split="train"):
9
  """make dataset for summarisation"""
10
  os.makedirs('data/raw')
11
  dataset = load_dataset(dataset, '3.0.0', split=split)
 
12
  df = pd.DataFrame()
13
  df['article'] = dataset['article']
14
  df['highlights'] = dataset['highlights']
 
9
  """make dataset for summarisation"""
10
  os.makedirs('data/raw')
11
  dataset = load_dataset(dataset, '3.0.0', split=split)
12
+ if not os.path.exists("data/raw"):
13
  df = pd.DataFrame()
14
  df['article'] = dataset['article']
15
  df['highlights'] = dataset['highlights']