mcding committed on
Commit
8e1a6c6
0 Parent(s):

New initial commit

Browse files
Files changed (5) hide show
  1. .gitattributes +35 -0
  2. Dockerfile +15 -0
  3. README.md +10 -0
  4. requirements.txt +2 -0
  5. run.py +33 -0
.gitattributes ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
6
+ *.ftz filter=lfs diff=lfs merge=lfs -text
7
+ *.gz filter=lfs diff=lfs merge=lfs -text
8
+ *.h5 filter=lfs diff=lfs merge=lfs -text
9
+ *.joblib filter=lfs diff=lfs merge=lfs -text
10
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
+ *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
+ *.model filter=lfs diff=lfs merge=lfs -text
13
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
14
+ *.npy filter=lfs diff=lfs merge=lfs -text
15
+ *.npz filter=lfs diff=lfs merge=lfs -text
16
+ *.onnx filter=lfs diff=lfs merge=lfs -text
17
+ *.ot filter=lfs diff=lfs merge=lfs -text
18
+ *.parquet filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pickle filter=lfs diff=lfs merge=lfs -text
21
+ *.pkl filter=lfs diff=lfs merge=lfs -text
22
+ *.pt filter=lfs diff=lfs merge=lfs -text
23
+ *.pth filter=lfs diff=lfs merge=lfs -text
24
+ *.rar filter=lfs diff=lfs merge=lfs -text
25
+ *.safetensors filter=lfs diff=lfs merge=lfs -text
26
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
28
+ *.tar filter=lfs diff=lfs merge=lfs -text
29
+ *.tflite filter=lfs diff=lfs merge=lfs -text
30
+ *.tgz filter=lfs diff=lfs merge=lfs -text
31
+ *.wasm filter=lfs diff=lfs merge=lfs -text
32
+ *.xz filter=lfs diff=lfs merge=lfs -text
33
+ *.zip filter=lfs diff=lfs merge=lfs -text
34
+ *.zst filter=lfs diff=lfs merge=lfs -text
35
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
Dockerfile ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ FROM python:3.9
2
+ # Work from /code and point HOME at the same directory.
3
+ WORKDIR /code
4
+ ENV HOME=/code
5
+ # Refresh the package index first and pass -y so the non-interactive build can never stop at a prompt.
6
+ RUN apt-get update && apt-get install -y --no-install-recommends curl && rm -rf /var/lib/apt/lists/*
7
+ RUN pip install pip -U
8
+ # Python packages imported by run.py (Spotlight is pinned, datasets is not).
9
+ RUN pip install renumics-spotlight==1.6.6
10
+ RUN pip install datasets
11
+ # Copy the app, create /code/.cache and open up permissions (presumably for a non-root runtime user - confirm).
12
+ COPY . .
13
+ RUN mkdir -p /code/.cache
14
+ RUN chmod -R 777 /code
15
+ CMD ["python", "run.py"]
README.md ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ title: Dataset Viewer
3
+ emoji: 😻
4
+ colorFrom: yellow
5
+ colorTo: yellow
6
+ sdk: docker
7
+ pinned: false
8
+ ---
9
+
10
+ Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
requirements.txt ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ renumics-spotlight
2
+ datasets
run.py ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+ from huggingface_hub import login
3
+ from datasets import load_dataset
4
+ from renumics import spotlight
5
+
6
+ DATASET_LIST = [  # tuples of (repo path under $HF_USERNAME, second positional arg to load_dataset - presumably the config name, split)
7
+ (os.environ["HF_USERNAME"] + "/Easy2Hard-AMC", "v1", "default"),
8
+ (os.environ["HF_USERNAME"] + "/Easy2Hard-Lichess", "v1", "default"),
9
+ (os.environ["HF_USERNAME"] + "/Easy2Hard-ARC", "v1", "test"),
10
+ (os.environ["HF_USERNAME"] + "/Easy2Hard-GSM8K", "v1", "test"),
11
+ (os.environ["HF_USERNAME"] + "/Easy2Hard-HellaSwag", "v1", "validation"),
12
+ (os.environ["HF_USERNAME"] + "/Easy2Hard-Winogrande", "v1", "validation"),
13
+ (os.environ["HF_USERNAME"] + "/Easy2Hard-Leaderboard", "v1", "default"),
14
+ ]
15
+
16
+
17
+ if __name__ == "__main__":
18
+ # Log in with the HF_TOKEN env var, then load every DATASET_LIST entry and write it out as a parquet file.
19
+ login(token=os.environ["HF_TOKEN"])
20
+ for dataset in DATASET_LIST:
21
+ ds = load_dataset(dataset[0], dataset[1], split=dataset[2])
22
+ ds.to_parquet(
23
+ f"{dataset[0].replace('/', '_')}_{dataset[1]}_{dataset[2]}.parquet"  # "/" in the repo path becomes "_" in the file name
24
+ )
25
+
26
+ view = spotlight.show(
27
+ dataset=ds.to_pandas(),  # NOTE(review): `ds` is whatever the loop assigned last; indentation is not visible here - confirm this call runs after the loop
28
+ folder=".",
29
+ port=7860,
30
+ host="0.0.0.0",
31
+ allow_filebrowsing=True,
32
+ wait="forever",  # presumably keeps the process serving instead of returning - confirm against the Spotlight docs
33
+ )