loubna plots
Browse files- data/plots/edu-100k/arc_acc_norm.json +1 -0
- data/plots/edu-100k/hellaswag_acc_norm.json +1 -0
- data/plots/edu-100k/index.json +1 -0
- data/plots/edu-100k/mmlu_acc_norm.json +1 -0
- data/plots/edu-100k/openbookqa_acc_norm.json +1 -0
- data/plots/edu-100k/piqa_acc_norm.json +1 -0
- data/plots/edu-100k/winogrande_acc_norm.json +1 -0
- data/plots/edu-8k/arc_acc_norm.json +1 -0
- data/plots/edu-8k/hellaswag_acc_norm.json +1 -0
- data/plots/edu-8k/index.json +1 -0
- data/plots/edu-8k/mmlu_acc_norm.json +1 -0
- data/plots/edu-8k/openbookqa_acc_norm.json +1 -0
- data/plots/edu-8k/piqa_acc_norm.json +1 -0
- data/plots/edu-8k/winogrande_acc_norm.json +1 -0
- plots/edu-100k.png +0 -0
- plots/edu-8k.png +0 -0
- src/plotting.js +15 -5
data/plots/edu-100k/arc_acc_norm.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"data": {"C4": {"x": ["C4"], "y": [0.4390000104904175], "label": "C4"}, "Dolma": {"x": ["Dolma"], "y": [0.4329999983310699], "label": "Dolma"}, "FineWeb (ours)": {"x": ["FineWeb (ours)"], "y": [0.4404999911785126], "label": "FineWeb (ours)"}, "RedPajama2": {"x": ["RedPajama2"], "y": [0.4395000040531158], "label": "RedPajama2"}, "RefinedWeb": {"x": ["RefinedWeb"], "y": [0.4375], "label": "RefinedWeb"}, "SlimPajama": {"x": ["SlimPajama"], "y": [0.4514999985694885], "label": "SlimPajama"}, "The Pile": {"x": ["The Pile"], "y": [0.4090000092983246], "label": "The Pile"}, "FineWeb-Edu": {"x": ["FineWeb-Edu"], "y": [0.5475000143051147], "label": "FineWeb-Edu"}}, "layout": {"showlegend": false, "title": {"text": "FineWeb-Edu at 100k steps"}, "xaxis": {"title": {"text": "Dataset", "standoff": 30}, "tickangle": 30}, "margin": {"b": 100}}}
|
data/plots/edu-100k/hellaswag_acc_norm.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"data": {"C4": {"x": ["C4"], "y": [0.6010000109672546], "label": "C4"}, "Dolma": {"x": ["Dolma"], "y": [0.5879999995231628], "label": "Dolma"}, "FineWeb (ours)": {"x": ["FineWeb (ours)"], "y": [0.6060000061988831], "label": "FineWeb (ours)"}, "RedPajama2": {"x": ["RedPajama2"], "y": [0.5440000295639038], "label": "RedPajama2"}, "RefinedWeb": {"x": ["RefinedWeb"], "y": [0.5709999799728394], "label": "RefinedWeb"}, "SlimPajama": {"x": ["SlimPajama"], "y": [0.5649999976158142], "label": "SlimPajama"}, "The Pile": {"x": ["The Pile"], "y": [0.515999972820282], "label": "The Pile"}, "FineWeb-Edu": {"x": ["FineWeb-Edu"], "y": [0.5830000042915344], "label": "FineWeb-Edu"}}, "layout": {"showlegend": false, "title": {"text": "FineWeb-Edu at 100k steps"}, "xaxis": {"title": {"text": "Dataset", "standoff": 30}, "tickangle": 30}, "margin": {"b": 100}}}
|
data/plots/edu-100k/index.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"files": {"mmlu/acc_norm": {"file": "mmlu_acc_norm.json"}, "arc/acc_norm": {"file": "arc_acc_norm.json"}, "openbookqa/acc_norm": {"file": "openbookqa_acc_norm.json"}, "piqa/acc_norm": {"file": "piqa_acc_norm.json"}, "hellaswag/acc_norm": {"file": "hellaswag_acc_norm.json"}, "winogrande/acc_norm": {"file": "winogrande_acc_norm.json"}}, "settings": {"defaultMetric": "mmlu/acc_norm", "slider": null, "autoSetXRange": false}}
|
data/plots/edu-100k/mmlu_acc_norm.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"data": {"C4": {"x": ["C4"], "y": [0.3100601136684418], "label": "C4"}, "Dolma": {"x": ["Dolma"], "y": [0.3082475662231445], "label": "Dolma"}, "FineWeb (ours)": {"x": ["FineWeb (ours)"], "y": [0.3212694227695465], "label": "FineWeb (ours)"}, "RedPajama2": {"x": ["RedPajama2"], "y": [0.3182428181171417], "label": "RedPajama2"}, "RefinedWeb": {"x": ["RefinedWeb"], "y": [0.3192791938781738], "label": "RefinedWeb"}, "SlimPajama": {"x": ["SlimPajama"], "y": [0.3266949653625488], "label": "SlimPajama"}, "The Pile": {"x": ["The Pile"], "y": [0.3129254281520843], "label": "The Pile"}, "FineWeb-Edu": {"x": ["FineWeb-Edu"], "y": [0.3591959178447723], "label": "FineWeb-Edu"}}, "layout": {"showlegend": false, "title": {"text": "FineWeb-Edu at 100k steps"}, "xaxis": {"title": {"text": "Dataset", "standoff": 30}, "tickangle": 30}, "margin": {"b": 100}}}
|
data/plots/edu-100k/openbookqa_acc_norm.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"data": {"C4": {"x": ["C4"], "y": [0.3740000128746032], "label": "C4"}, "Dolma": {"x": ["Dolma"], "y": [0.3499999940395355], "label": "Dolma"}, "FineWeb (ours)": {"x": ["FineWeb (ours)"], "y": [0.3680000007152557], "label": "FineWeb (ours)"}, "RedPajama2": {"x": ["RedPajama2"], "y": [0.3339999914169311], "label": "RedPajama2"}, "RefinedWeb": {"x": ["RefinedWeb"], "y": [0.3459999859333038], "label": "RefinedWeb"}, "SlimPajama": {"x": ["SlimPajama"], "y": [0.3499999940395355], "label": "SlimPajama"}, "The Pile": {"x": ["The Pile"], "y": [0.3339999914169311], "label": "The Pile"}, "FineWeb-Edu": {"x": ["FineWeb-Edu"], "y": [0.4000000059604645], "label": "FineWeb-Edu"}}, "layout": {"showlegend": false, "title": {"text": "FineWeb-Edu at 100k steps"}, "xaxis": {"title": {"text": "Dataset", "standoff": 30}, "tickangle": 30}, "margin": {"b": 100}}}
|
data/plots/edu-100k/piqa_acc_norm.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"data": {"C4": {"x": ["C4"], "y": [0.7739999890327454], "label": "C4"}, "Dolma": {"x": ["Dolma"], "y": [0.7549999952316284], "label": "Dolma"}, "FineWeb (ours)": {"x": ["FineWeb (ours)"], "y": [0.7580000162124634], "label": "FineWeb (ours)"}, "RedPajama2": {"x": ["RedPajama2"], "y": [0.7239999771118164], "label": "RedPajama2"}, "RefinedWeb": {"x": ["RefinedWeb"], "y": [0.7710000276565552], "label": "RefinedWeb"}, "SlimPajama": {"x": ["SlimPajama"], "y": [0.7379999756813049], "label": "SlimPajama"}, "The Pile": {"x": ["The Pile"], "y": [0.7179999947547913], "label": "The Pile"}, "FineWeb-Edu": {"x": ["FineWeb-Edu"], "y": [0.7590000033378601], "label": "FineWeb-Edu"}}, "layout": {"showlegend": false, "title": {"text": "FineWeb-Edu at 100k steps"}, "xaxis": {"title": {"text": "Dataset", "standoff": 30}, "tickangle": 30}, "margin": {"b": 100}}}
|
data/plots/edu-100k/winogrande_acc_norm.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"data": {"C4": {"x": ["C4"], "y": [0.5490000247955322], "label": "C4"}, "Dolma": {"x": ["Dolma"], "y": [0.550000011920929], "label": "Dolma"}, "FineWeb (ours)": {"x": ["FineWeb (ours)"], "y": [0.5559999942779541], "label": "FineWeb (ours)"}, "RedPajama2": {"x": ["RedPajama2"], "y": [0.5509999990463257], "label": "RedPajama2"}, "RefinedWeb": {"x": ["RefinedWeb"], "y": [0.5680000185966492], "label": "RefinedWeb"}, "SlimPajama": {"x": ["SlimPajama"], "y": [0.5519999861717224], "label": "SlimPajama"}, "The Pile": {"x": ["The Pile"], "y": [0.5350000262260437], "label": "The Pile"}, "FineWeb-Edu": {"x": ["FineWeb-Edu"], "y": [0.5720000267028809], "label": "FineWeb-Edu"}}, "layout": {"showlegend": false, "title": {"text": "FineWeb-Edu at 100k steps"}, "xaxis": {"title": {"text": "Dataset", "standoff": 30}, "tickangle": 30}, "margin": {"b": 100}}}
|
data/plots/edu-8k/arc_acc_norm.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"data": {"FW-Edu-threshold=4": {"x": ["FW-Edu-threshold=4"], "y": [0.4675000011920929], "label": "FW-Edu-threshold=4"}, "FW-Edu-threshold=3": {"x": ["FW-Edu-threshold=3"], "y": [0.42750000953674316], "label": "FW-Edu-threshold=3"}, "FW-Edu-threshold=2": {"x": ["FW-Edu-threshold=2"], "y": [0.38850000500679016], "label": "FW-Edu-threshold=2"}, "FineWeb (FW)": {"x": ["FineWeb (FW)"], "y": [0.35100001096725464], "label": "FineWeb (FW)"}}, "layout": {"showlegend": false, "title": {"text": "FineWeb-Edu thresholding"}, "xaxis": {"title": {"standoff": 60, "text": "Dataset"}, "tickangle": 30}, "margin": {"b": 120}}}
|
data/plots/edu-8k/hellaswag_acc_norm.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"data": {"FW-Edu-threshold=4": {"x": ["FW-Edu-threshold=4"], "y": [0.3720000088214874], "label": "FW-Edu-threshold=4"}, "FW-Edu-threshold=3": {"x": ["FW-Edu-threshold=3"], "y": [0.4390000104904175], "label": "FW-Edu-threshold=3"}, "FW-Edu-threshold=2": {"x": ["FW-Edu-threshold=2"], "y": [0.421999990940094], "label": "FW-Edu-threshold=2"}, "FineWeb (FW)": {"x": ["FineWeb (FW)"], "y": [0.41200000047683716], "label": "FineWeb (FW)"}}, "layout": {"showlegend": false, "title": {"text": "FineWeb-Edu thresholding"}, "xaxis": {"title": {"standoff": 60, "text": "Dataset"}, "tickangle": 30}, "margin": {"b": 120}}}
|
data/plots/edu-8k/index.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"files": {"mmlu/acc_norm": {"file": "mmlu_acc_norm.json"}, "arc/acc_norm": {"file": "arc_acc_norm.json"}, "openbookqa/acc_norm": {"file": "openbookqa_acc_norm.json"}, "piqa/acc_norm": {"file": "piqa_acc_norm.json"}, "hellaswag/acc_norm": {"file": "hellaswag_acc_norm.json"}, "winogrande/acc_norm": {"file": "winogrande_acc_norm.json"}}, "settings": {"defaultMetric": "mmlu/acc_norm", "slider": null, "autoSetXRange": false}}
|
data/plots/edu-8k/mmlu_acc_norm.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"data": {"FW-Edu-threshold=4": {"x": ["FW-Edu-threshold=4"], "y": [0.30724120140075684], "label": "FW-Edu-threshold=4"}, "FW-Edu-threshold=3": {"x": ["FW-Edu-threshold=3"], "y": [0.2939043641090393], "label": "FW-Edu-threshold=3"}, "FW-Edu-threshold=2": {"x": ["FW-Edu-threshold=2"], "y": [0.2838209271430969], "label": "FW-Edu-threshold=2"}, "FineWeb (FW)": {"x": ["FineWeb (FW)"], "y": [0.26926591992378235], "label": "FineWeb (FW)"}}, "layout": {"showlegend": false, "title": {"text": "FineWeb-Edu thresholding"}, "xaxis": {"title": {"standoff": 60, "text": "Dataset"}, "tickangle": 30}, "margin": {"b": 120}}}
|
data/plots/edu-8k/openbookqa_acc_norm.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"data": {"FW-Edu-threshold=4": {"x": ["FW-Edu-threshold=4"], "y": [0.3540000021457672], "label": "FW-Edu-threshold=4"}, "FW-Edu-threshold=3": {"x": ["FW-Edu-threshold=3"], "y": [0.3400000035762787], "label": "FW-Edu-threshold=3"}, "FW-Edu-threshold=2": {"x": ["FW-Edu-threshold=2"], "y": [0.3499999940395355], "label": "FW-Edu-threshold=2"}, "FineWeb (FW)": {"x": ["FineWeb (FW)"], "y": [0.2759999930858612], "label": "FineWeb (FW)"}}, "layout": {"showlegend": false, "title": {"text": "FineWeb-Edu thresholding"}, "xaxis": {"title": {"standoff": 60, "text": "Dataset"}, "tickangle": 30}, "margin": {"b": 120}}}
|
data/plots/edu-8k/piqa_acc_norm.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"data": {"FW-Edu-threshold=4": {"x": ["FW-Edu-threshold=4"], "y": [0.6399999856948853], "label": "FW-Edu-threshold=4"}, "FW-Edu-threshold=3": {"x": ["FW-Edu-threshold=3"], "y": [0.6819999814033508], "label": "FW-Edu-threshold=3"}, "FW-Edu-threshold=2": {"x": ["FW-Edu-threshold=2"], "y": [0.6970000267028809], "label": "FW-Edu-threshold=2"}, "FineWeb (FW)": {"x": ["FineWeb (FW)"], "y": [0.703000009059906], "label": "FineWeb (FW)"}}, "layout": {"showlegend": false, "title": {"text": "FineWeb-Edu thresholding"}, "xaxis": {"title": {"standoff": 60, "text": "Dataset"}, "tickangle": 30}, "margin": {"b": 120}}}
|
data/plots/edu-8k/winogrande_acc_norm.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"data": {"FW-Edu-threshold=4": {"x": ["FW-Edu-threshold=4"], "y": [0.5080000162124634], "label": "FW-Edu-threshold=4"}, "FW-Edu-threshold=3": {"x": ["FW-Edu-threshold=3"], "y": [0.4869999885559082], "label": "FW-Edu-threshold=3"}, "FW-Edu-threshold=2": {"x": ["FW-Edu-threshold=2"], "y": [0.5139999985694885], "label": "FW-Edu-threshold=2"}, "FineWeb (FW)": {"x": ["FineWeb (FW)"], "y": [0.49300000071525574], "label": "FineWeb (FW)"}}, "layout": {"showlegend": false, "title": {"text": "FineWeb-Edu thresholding"}, "xaxis": {"title": {"standoff": 60, "text": "Dataset"}, "tickangle": 30}, "margin": {"b": 120}}}
|
plots/edu-100k.png
ADDED
plots/edu-8k.png
ADDED
src/plotting.js
CHANGED
@@ -1,3 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
const TASK_ID_TO_NAME = {
|
2 |
// Ablations
|
3 |
agg_score: "Aggregate Score",
|
@@ -97,6 +107,7 @@ const DEFAULT_LAYOUT = {
|
|
97 |
const getAutoRange = (traces) => {
|
98 |
let minX = Math.min(...traces.flatMap((trace) => trace.x));
|
99 |
let maxX = Math.max(...traces.flatMap((trace) => trace.x));
|
|
|
100 |
return [minX * 0.95, maxX * 1.05];
|
101 |
};
|
102 |
|
@@ -138,17 +149,15 @@ const init_ablation_plot = function () {
|
|
138 |
const traces = metricData?.traces?.[metricName] ?? [];
|
139 |
for (const key in metricData?.data ?? []) {
|
140 |
const traceData = metricData.data[key];
|
|
|
141 |
const y = rollingWindow(traceData.y, sliderValue);
|
142 |
const x = traceData.x.slice(0, y.length);
|
|
|
143 |
const trace = {
|
144 |
x: x,
|
145 |
y: y,
|
146 |
-
type: "scatter",
|
147 |
-
mode: "lines",
|
148 |
-
line: {
|
149 |
-
width: 2.5,
|
150 |
-
},
|
151 |
name: traceData.label,
|
|
|
152 |
};
|
153 |
traces.push(trace);
|
154 |
}
|
@@ -167,6 +176,7 @@ const init_ablation_plot = function () {
|
|
167 |
},
|
168 |
metricData.layout
|
169 |
);
|
|
|
170 |
Plotly.react(plot, traces, layout);
|
171 |
|
172 |
window.addEventListener("resize", () => {
|
|
|
1 |
+
const LINE_SETTINGS = {
|
2 |
+
width: 2.5,
|
3 |
+
type: "scatter",
|
4 |
+
mode: "lines",
|
5 |
+
}
|
6 |
+
const BAR_SETTINGS = {
|
7 |
+
width: 0.5,
|
8 |
+
type: "bar",
|
9 |
+
}
|
10 |
+
|
11 |
const TASK_ID_TO_NAME = {
|
12 |
// Ablations
|
13 |
agg_score: "Aggregate Score",
|
|
|
107 |
const getAutoRange = (traces) => {
|
108 |
let minX = Math.min(...traces.flatMap((trace) => trace.x));
|
109 |
let maxX = Math.max(...traces.flatMap((trace) => trace.x));
|
110 |
+
console.log(minX, maxX);
|
111 |
return [minX * 0.95, maxX * 1.05];
|
112 |
};
|
113 |
|
|
|
149 |
const traces = metricData?.traces?.[metricName] ?? [];
|
150 |
for (const key in metricData?.data ?? []) {
|
151 |
const traceData = metricData.data[key];
|
152 |
+
console.log(traceData)
|
153 |
const y = rollingWindow(traceData.y, sliderValue);
|
154 |
const x = traceData.x.slice(0, y.length);
|
155 |
+
const plotSettings = x.length > 1 ? LINE_SETTINGS : BAR_SETTINGS;
|
156 |
const trace = {
|
157 |
x: x,
|
158 |
y: y,
|
|
|
|
|
|
|
|
|
|
|
159 |
name: traceData.label,
|
160 |
+
...plotSettings,
|
161 |
};
|
162 |
traces.push(trace);
|
163 |
}
|
|
|
176 |
},
|
177 |
metricData.layout
|
178 |
);
|
179 |
+
console.log(layout);
|
180 |
Plotly.react(plot, traces, layout);
|
181 |
|
182 |
window.addEventListener("resize", () => {
|