dedup simul
Browse files
data/plots/duplicates-simul/default.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"data": {"1": {"x": ["1B", "10B", "100B", "350B", "1T"], "y": [0.994974, 0.9515081, 0.60887281, 0.1741474885714285, 0.006232416], "label": "1"}, "2": {"x": ["1B", "10B", "100B", "350B", "1T"], "y": [0.005008, 0.047331, 0.30282154, 0.3071204342857143, 0.032470074], "label": "2"}, "3": {"x": ["1B", "10B", "100B", "350B", "1T"], "y": [1.8e-05, 0.0011439, 0.0745482, 0.2680183371428571, 0.083742993], "label": "3"}, "4-8": {"x": ["1B", "10B", "100B", "350B", "1T"], "y": [0.0, 1.7e-05, 0.01375745, 0.25064894285714273, 0.8176358810000001], "label": "4-8"}, "8-16": {"x": ["1B", "10B", "100B", "350B", "1T"], "y": [0.0, 0.0, 0.0, 6.479714285714286e-05, 0.05991048400000001], "label": "8-16"}, "16-32": {"x": ["1B", "10B", "100B", "350B", "1T"], "y": [0.0, 0.0, 0.0, 0.0, 8.152000000000001e-06], "label": "16-32"}}, "layout": {"title": {"text": "Sampling from 1000 identical buckets with 200B tokens each"}, "xaxis": {"title": {"text": "Sample size"}}, "yaxis": {"title": {"text": "Dataset fraction"}}, "barmode": "stack", "legend": {"title": {"text": "# duplicates", "font": {"size": 14, "weight": "bold"}}, "font": {"size": 14}, "bgcolor": "rgba(255, 255, 255, 0.9)", "orientation": "v", "xanchor": "left", "yanchor": "bottom", "x": 0.01, "y": 0}}}
|
data/plots/duplicates-simul/index.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"files": {"default": {"file": "default.json"}}, "settings": {"defaultMetric": "default", "slider": null, "autoSetXRange": false, "type": "bar"}}
|
data/plots/edu-100k/index.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"files": {"mmlu/acc_norm": {"file": "mmlu_acc_norm.json"}, "arc/acc_norm": {"file": "arc_acc_norm.json"}, "openbookqa/acc_norm": {"file": "openbookqa_acc_norm.json"}, "piqa/acc_norm": {"file": "piqa_acc_norm.json"}, "hellaswag/acc_norm": {"file": "hellaswag_acc_norm.json"}, "winogrande/acc_norm": {"file": "winogrande_acc_norm.json"}}, "settings": {"defaultMetric": "mmlu/acc_norm", "slider": null, "autoSetXRange": false}}
|
|
|
1 |
+
{"files": {"mmlu/acc_norm": {"file": "mmlu_acc_norm.json"}, "arc/acc_norm": {"file": "arc_acc_norm.json"}, "openbookqa/acc_norm": {"file": "openbookqa_acc_norm.json"}, "piqa/acc_norm": {"file": "piqa_acc_norm.json"}, "hellaswag/acc_norm": {"file": "hellaswag_acc_norm.json"}, "winogrande/acc_norm": {"file": "winogrande_acc_norm.json"}}, "settings": {"defaultMetric": "mmlu/acc_norm", "slider": null, "autoSetXRange": false, "type": "bar"}}
|
data/plots/edu-8k/index.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"files": {"mmlu/acc_norm": {"file": "mmlu_acc_norm.json"}, "arc/acc_norm": {"file": "arc_acc_norm.json"}, "openbookqa/acc_norm": {"file": "openbookqa_acc_norm.json"}, "piqa/acc_norm": {"file": "piqa_acc_norm.json"}, "hellaswag/acc_norm": {"file": "hellaswag_acc_norm.json"}, "winogrande/acc_norm": {"file": "winogrande_acc_norm.json"}}, "settings": {"defaultMetric": "mmlu/acc_norm", "slider": null, "autoSetXRange": false}}
|
|
|
1 |
+
{"files": {"mmlu/acc_norm": {"file": "mmlu_acc_norm.json"}, "arc/acc_norm": {"file": "arc_acc_norm.json"}, "openbookqa/acc_norm": {"file": "openbookqa_acc_norm.json"}, "piqa/acc_norm": {"file": "piqa_acc_norm.json"}, "hellaswag/acc_norm": {"file": "hellaswag_acc_norm.json"}, "winogrande/acc_norm": {"file": "winogrande_acc_norm.json"}}, "settings": {"defaultMetric": "mmlu/acc_norm", "slider": null, "autoSetXRange": false, "type": "bar"}}
|
src/plotting.js
CHANGED
@@ -40,9 +40,13 @@ const DEFAULT_SETTINGS = {
|
|
40 |
default: 0,
|
41 |
},
|
42 |
defaultMetric: "agg_score",
|
|
|
43 |
};
|
44 |
|
45 |
const DEFAULT_LAYOUT = {
|
|
|
|
|
|
|
46 |
title: {
|
47 |
text: "Plot Title",
|
48 |
font: {
|
@@ -146,6 +150,7 @@ const init_ablation_plot = function () {
|
|
146 |
const sliderValue = parseInt(slider?.value ?? 0);
|
147 |
console.log(indexMapping)
|
148 |
console.log(metricName)
|
|
|
149 |
const metricData = await fetch(
|
150 |
`data/plots/${plotName}/${indexMapping[metricName]["file"]}`
|
151 |
).then((response) => response.json());
|
@@ -154,7 +159,7 @@ const init_ablation_plot = function () {
|
|
154 |
const traceData = metricData.data[key];
|
155 |
const y = rollingWindow(traceData.y, sliderValue);
|
156 |
const x = traceData.x.slice(0, y.length);
|
157 |
-
const plotSettings =
|
158 |
const trace = {
|
159 |
x: x,
|
160 |
y: y,
|
|
|
40 |
default: 0,
|
41 |
},
|
42 |
defaultMetric: "agg_score",
|
43 |
+
type: "line"
|
44 |
};
|
45 |
|
46 |
const DEFAULT_LAYOUT = {
|
47 |
+
font: {
|
48 |
+
family: "apple-system, Arial, sans-serif",
|
49 |
+
},
|
50 |
title: {
|
51 |
text: "Plot Title",
|
52 |
font: {
|
|
|
150 |
const sliderValue = parseInt(slider?.value ?? 0);
|
151 |
console.log(indexMapping)
|
152 |
console.log(metricName)
|
153 |
+
console.log(plotElement)
|
154 |
const metricData = await fetch(
|
155 |
`data/plots/${plotName}/${indexMapping[metricName]["file"]}`
|
156 |
).then((response) => response.json());
|
|
|
159 |
const traceData = metricData.data[key];
|
160 |
const y = rollingWindow(traceData.y, sliderValue);
|
161 |
const x = traceData.x.slice(0, y.length);
|
162 |
+
const plotSettings = settings.type === "bar" ? BAR_SETTINGS : LINE_SETTINGS;
|
163 |
const trace = {
|
164 |
x: x,
|
165 |
y: y,
|