compendious committed on
Commit
035b2bd
·
1 Parent(s): f179148

And reviewed cleaner scripts

backend/README.md ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ # Backend
2
+
3
+ The backend only implements the API and orchestrates the models. For data- or model-related work, see the rest of the codebase.
frontend/README.md CHANGED
@@ -1,4 +1,4 @@
1
- # Précis — Frontend
2
 
3
  React 19 + Vite frontend for Précis. See the [root README](../README.md) for full setup instructions.
4
 
 
1
+ # Frontend
2
 
3
  React 19 + Vite frontend for Précis. See the [root README](../README.md) for full setup instructions.
4
 
scripts/cleaners/clean_ds.py CHANGED
@@ -22,7 +22,7 @@ def write_jsonl(rows, output_path):
22
  with open(output_path, 'w', encoding='utf-8') as f:
23
  for row in rows:
24
  new_data = {
25
- "id": row["id"],
26
  "original_source": "DialogSum",
27
  "dialogue": row["dialogue"],
28
  "summary": row["summary"],
 
22
  with open(output_path, 'w', encoding='utf-8') as f:
23
  for row in rows:
24
  new_data = {
25
+ "id": i,
26
  "original_source": "DialogSum",
27
  "dialogue": row["dialogue"],
28
  "summary": row["summary"],
scripts/cleaners/clean_ms.py CHANGED
@@ -24,7 +24,7 @@ def write_jsonl(lines, output_path):
24
  for line in lines:
25
  data = json.loads(line)
26
  new_data = {
27
- "id": data["id"],
28
  "original_source": "MediaSum",
29
  "url": data["url"],
30
  "summary": data["summary"],
 
24
  for line in lines:
25
  data = json.loads(line)
26
  new_data = {
27
+ "id": i,
28
  "original_source": "MediaSum",
29
  "url": data["url"],
30
  "summary": data["summary"],