Gagan Bhatia committed on
Commit
cc08aa0
1 Parent(s): 19ef522

Update make_dataset.py

Browse files
Files changed (1) hide show
  1. src/data/make_dataset.py +1 -0
src/data/make_dataset.py CHANGED
@@ -8,6 +8,7 @@ import pprint
8
 
9
  def make_dataset(dataset='cnn_dailymail', split='train'):
10
  """make dataset for summarisation"""
 
11
  dataset = load_dataset(dataset, '3.0.0', split=split)
12
  df = pd.DataFrame()
13
  df['article'] = dataset['article']
 
8
 
9
  def make_dataset(dataset='cnn_dailymail', split='train'):
10
  """make dataset for summarisation"""
11
+ if not os.path.exists('data/raw'):
12
  dataset = load_dataset(dataset, '3.0.0', split=split)
13
  df = pd.DataFrame()
14
  df['article'] = dataset['article']