radames's picture
first
d04fa6b
raw
history blame
6.49 kB
import { select } from "https://cdn.skypack.dev/d3-selection@3";
import { color, hcl } from "https://cdn.skypack.dev/d3-color@3";
import {
piecewise,
interpolateRgb,
} from "https://cdn.skypack.dev/d3-interpolate@3";
const d3 = { select, color, hcl, piecewise, interpolateRgb };
const colorPalette = d3.piecewise(d3.interpolateRgb.gamma(2.2), [
"#0E21A0",
"#4D2DB7",
"#9D44C0",
"#EC53B0",
"#F57B55",
"#FFDB5A",
]);
class WorkerPool {
constructor(size) {
this.workers = [];
this.size = size;
this.init();
}
get size() {
return this._size;
}
set size(size) {
this._size = size;
}
init() {
console.log("init", this.size);
for (let i = 0; i < this.size; i++) {
this.workers.push({
worker: new Worker("./llama2c.worker.js", { type: "module" }),
inUse: false,
id: window.crypto.randomUUID(),
});
}
}
getWorker() {
return new Promise((resolve) => {
const check = () => {
for (let worker of this.workers) {
if (!worker.inUse) {
worker.inUse = true;
resolve(worker.worker);
return;
}
}
setTimeout(check, 100);
};
check();
});
}
releaseWorker(worker) {
this.workers.find((w) => w.worker === worker).inUse = false;
}
}
// base url for audio examples
const MODELS_BASE_URL =
"https://huggingface.co/karpathy/tinyllamas/resolve/main";
// models base url
const MODELS = {
stories15M: {
url: "stories15M.bin",
seq_len: 256,
},
stories42M: {
url: "stories42M.bin",
seq_len: 1024,
},
stories110M: {
url: "stories110M.bin",
seq_len: 1024,
},
};
const workerPool = new WorkerPool(window.navigator.hardwareConcurrency);
async function generateSequence({
worker,
prompt,
weightsURL,
modelID,
maxSeqLen,
temp,
repeatPenalty,
contentEl,
controller,
}) {
return new Promise((resolve, reject) => {
const seed = BigInt(Math.floor(Math.random() * 2 ** 64 - 1));
worker.postMessage({
weightsURL,
modelID,
tokenizerURL: "tokenizer.json",
prompt,
temp,
repeatPenalty,
seed: seed,
maxSeqLen,
command: "start",
});
function handleAbort() {
console.log("abort");
worker.postMessage({ command: "abort" });
}
function updateStatus(data) {
if (data.status === "generating") {
const { message, prompt, sentence, tokensSec, totalTime } = data;
contentEl.innerHTML = `<span class="font-semibold">${prompt}</span>
${sentence.replace(/\<s\>|\<\/s\>/g, "")}`;
}
}
const handleMessage = (event) => {
const { status, error } = event.data;
if (status) updateStatus(event.data);
if (error) reject(new Error(error));
if (status === "complete" || status === "aborted") {
workerPool.releaseWorker(worker);
resolve(event.data);
}
};
controller.signal.addEventListener("abort", handleAbort);
worker.addEventListener("message", handleMessage);
});
}
async function initWorkers() {
const containerEl = d3.select("#container");
d3.select("#model").on("input", (e) => {
const model = MODELS[e.target.value];
d3.select("#max-seq").property("max", model.seq_len);
});
const containers = await Promise.all(
workerPool.workers.map(async (_, i) => {
const contentEl = d3.select(document.createElement("div"));
contentEl.on("pointerover pointerdown", (e) => {
d3.select(e.currentTarget).style("z-index", 100);
});
contentEl.on("pointerout pointercancel pointerleave", (e) => {
d3.select(e.currentTarget).style("z-index", "unset");
});
const bgColor = colorPalette(i / workerPool.size);
const fontColor = d3.hcl(bgColor).l < 50 ? "#fff" : "#000";
contentEl
.style("background-color", bgColor)
.style("color", fontColor)
.style("grid-row-start", `${i + 1}`)
.classed("c-block ", true);
containerEl.append(() => contentEl.node());
return [contentEl.node(), await workerPool.getWorker()];
})
);
return containers;
}
async function fetchArrayBuffer(url) {
const cacheName = "llama2c-candle-cache";
const cache = await caches.open(cacheName);
const cachedResponse = await cache.match(url);
if (cachedResponse) {
const data = await cachedResponse.arrayBuffer();
return new Uint8Array(data);
}
const res = await fetch(url, { cache: "force-cache" });
cache.put(url, res.clone());
return new Uint8Array(await res.arrayBuffer());
}
async function run(containers, controller) {
const getValue = (e) => e.value;
const prompt = document.querySelector("#prompt");
const maxSeqLen = document.querySelector("#max-seq");
const temp = document.querySelector("#temperature");
const repeatPenalty = document.querySelector("#repeat-penalty");
const modelID = document.querySelector("#model");
const weightsURL = `${MODELS_BASE_URL}/${MODELS[getValue(modelID)].url}`;
maxSeqLen.disabled = true;
temp.disabled = true;
repeatPenalty.disabled = true;
modelID.disabled = true;
// pre fetch and cache weights and tokenizer
await Promise.all([
fetchArrayBuffer(weightsURL),
fetchArrayBuffer(`tokenizer.json`),
]);
await Promise.all(
containers.map(([container, worker]) =>
generateSequence({
worker,
prompt: getValue(prompt),
weightsURL,
modelID: getValue(modelID),
maxSeqLen: getValue(maxSeqLen),
temp: getValue(temp),
repeatPenalty: getValue(repeatPenalty),
contentEl: container,
controller,
})
)
);
maxSeqLen.disabled = false;
temp.disabled = false;
repeatPenalty.disabled = false;
modelID.disabled = false;
}
initWorkers().then((containers) => {
const runBtn = d3.select(document.querySelector("#run"));
let runController = new AbortController();
let isRunning = false;
d3.select("#form").on("submit", async (e) => {
e.preventDefault();
if (isRunning) {
console.log("stop");
stopRunning();
} else {
console.log("start");
startRunning();
await run(containers, runController);
stopRunning();
}
});
function startRunning() {
isRunning = true;
runBtn.text("Stop");
}
function stopRunning() {
runBtn.text("Run");
runController.abort();
runController = new AbortController();
isRunning = false;
}
});