fil committed on
Commit
dae32f4
·
1 Parent(s): 8e6eb11

try smaller

Browse files
Files changed (1) hide show
  1. docs/data/presse.parquet.sh +1 -1
docs/data/presse.parquet.sh CHANGED
@@ -6,7 +6,7 @@ SELECT title
6
  , author
7
  , LPAD((REGEXP_EXTRACT(date, '1[0-9][0-9][0-9]') || '-01-01'), 10, '0')::DATE AS year
8
  FROM read_parquet(
9
- [('https://huggingface.co/datasets/PleIAs/French-PD-Newspapers/resolve/main/gallica_presse_{:d}.parquet').format(n) for n in range(1, 321)])
10
  );
11
  COPY presse TO '$TMPDIR/presse.parquet' (FORMAT 'parquet', COMPRESSION 'GZIP');
12
  """ | duckdb
 
6
  , author
7
  , LPAD((REGEXP_EXTRACT(date, '1[0-9][0-9][0-9]') || '-01-01'), 10, '0')::DATE AS year
8
  FROM read_parquet(
9
+ [('https://huggingface.co/datasets/PleIAs/French-PD-Newspapers/resolve/main/gallica_presse_{:d}.parquet').format(n) for n in range(1, 2)])
10
  );
11
  COPY presse TO '$TMPDIR/presse.parquet' (FORMAT 'parquet', COMPRESSION 'GZIP');
12
  """ | duckdb