Gagan Bhatia committed on
Commit
bc51ebd
1 Parent(s): 8d55377

Update make_dataset.py

Browse files
Files changed (1) hide show
  1. src/data/make_dataset.py +1 -0
src/data/make_dataset.py CHANGED
@@ -11,6 +11,7 @@ def make_dataset(dataset="cnn_dailymail", split="train"):
11
  os.makedirs("data/raw")
12
  dataset = load_dataset(dataset, "3.0.0", split=split)
13
  df = pd.DataFrame()
 
14
  df["highlights"] = dataset["highlights"]
15
  df.to_csv("data/raw/{}.csv".format(split))
16
 
 
11
  os.makedirs("data/raw")
12
  dataset = load_dataset(dataset, "3.0.0", split=split)
13
  df = pd.DataFrame()
14
+ df["article"] = dataset["article"]
15
  df["highlights"] = dataset["highlights"]
16
  df.to_csv("data/raw/{}.csv".format(split))
17