Spaces:
Running
Running
let's try 321 again
Browse files
docs/data/presse.parquet.sh
CHANGED
@@ -6,7 +6,7 @@ SELECT title
|
|
6 |
, author
|
7 |
, LPAD((REGEXP_EXTRACT(date, '1[0-9][0-9][0-9]') || '-01-01'), 10, '0')::DATE AS year
|
8 |
FROM read_parquet(
|
9 |
-
[('https://huggingface.co/datasets/PleIAs/French-PD-Newspapers/resolve/main/gallica_presse_{:d}.parquet').format(n) for n in range(1,
|
10 |
);
|
11 |
COPY presse TO '$TMPDIR/presse.parquet' (FORMAT 'parquet', COMPRESSION 'GZIP');
|
12 |
""" | duckdb
|
|
|
6 |
, author
|
7 |
, LPAD((REGEXP_EXTRACT(date, '1[0-9][0-9][0-9]') || '-01-01'), 10, '0')::DATE AS year
|
8 |
FROM read_parquet(
|
9 |
+
[('https://huggingface.co/datasets/PleIAs/French-PD-Newspapers/resolve/main/gallica_presse_{:d}.parquet').format(n) for n in range(1, 321)])
|
10 |
);
|
11 |
COPY presse TO '$TMPDIR/presse.parquet' (FORMAT 'parquet', COMPRESSION 'GZIP');
|
12 |
""" | duckdb
|