// utils/XetBlob.spec.ts
import { describe, expect, it } from "vitest";
import type { ReconstructionInfo } from "./XetBlob";
import { bg4_regoup_bytes, XetBlob } from "./XetBlob";
import { sum } from "./sum";
describe("XetBlob", () => {
it("should lazy load the first 22 bytes", async () => {
const blob = new XetBlob({
hash: "7b3b6d07673a88cf467e67c1f7edef1a8c268cbf66e9dd9b0366322d4ab56d9b",
size: 5_234_139_343,
refreshUrl: "https://huggingface.co/api/models/celinah/xet-experiments/xet-read-token/main",
});
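// A safetensors file begins with an 8-byte little-endian header length followed by a JSON
// header that starts with `{"__metadata__"`, so bytes 10-21 of this file spell "__metadata__".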
expect(await blob.slice(10, 22).text()).toBe("__metadata__");
});
it("should load the first chunk correctly", async () => {
let xorbCount = 0;
const blob = new XetBlob({
refreshUrl: "https://huggingface.co/api/models/celinah/xet-experiments/xet-read-token/main",
hash: "7b3b6d07673a88cf467e67c1f7edef1a8c268cbf66e9dd9b0366322d4ab56d9b",
size: 5_234_139_343,
fetch: async (url, opts) => {
if (typeof url === "string" && url.includes("/xorbs/")) {
xorbCount++;
}
return fetch(url, opts);
},
});
const xetDownload = await blob.slice(0, 29928).arrayBuffer();
const bridgeDownload = await fetch(
"https://huggingface.co/celinah/xet-experiments/resolve/main/model5GB.safetensors",
{
headers: {
Range: "bytes=0-29927",
},
}
).then((res) => res.arrayBuffer());
expect(new Uint8Array(xetDownload)).toEqual(new Uint8Array(bridgeDownload));
expect(xorbCount).toBe(1);
});
it("should load just past the first chunk correctly", async () => {
let xorbCount = 0;
const blob = new XetBlob({
refreshUrl: "https://huggingface.co/api/models/celinah/xet-experiments/xet-read-token/main",
hash: "7b3b6d07673a88cf467e67c1f7edef1a8c268cbf66e9dd9b0366322d4ab56d9b",
size: 5_234_139_343,
fetch: async (url, opts) => {
if (typeof url === "string" && url.includes("/xorbs/")) {
xorbCount++;
}
return fetch(url, opts);
},
});
const xetDownload = await blob.slice(0, 29929).arrayBuffer();
const bridgeDownload = await fetch(
"https://huggingface.co/celinah/xet-experiments/resolve/main/model5GB.safetensors",
{
headers: {
Range: "bytes=0-29928",
},
}
).then((res) => res.arrayBuffer());
expect(xetDownload.byteLength).toBe(29929);
expect(new Uint8Array(xetDownload)).toEqual(new Uint8Array(bridgeDownload));
expect(xorbCount).toBe(2);
});
it("should load the first 200kB correctly", async () => {
let xorbCount = 0;
const blob = new XetBlob({
refreshUrl: "https://huggingface.co/api/models/celinah/xet-experiments/xet-read-token/main",
hash: "7b3b6d07673a88cf467e67c1f7edef1a8c268cbf66e9dd9b0366322d4ab56d9b",
size: 5_234_139_343,
fetch: async (url, opts) => {
if (typeof url === "string" && url.includes("/xorbs/")) {
xorbCount++;
}
return fetch(url, opts);
},
// internalLogging: true,
});
const xetDownload = await blob.slice(0, 200_000).arrayBuffer();
const bridgeDownload = await fetch(
"https://huggingface.co/celinah/xet-experiments/resolve/main/model5GB.safetensors",
{
headers: {
Range: "bytes=0-199999",
},
}
).then((res) => res.arrayBuffer());
expect(xetDownload.byteLength).toBe(200_000);
expect(new Uint8Array(xetDownload)).toEqual(new Uint8Array(bridgeDownload));
expect(xorbCount).toBe(2);
}, 60_000);
it("should load correctly when loading far into a chunk range", async () => {
const blob = new XetBlob({
refreshUrl: "https://huggingface.co/api/models/celinah/xet-experiments/xet-read-token/main",
hash: "7b3b6d07673a88cf467e67c1f7edef1a8c268cbf66e9dd9b0366322d4ab56d9b",
size: 5_234_139_343,
// internalLogging: true,
});
const xetDownload = await blob.slice(10_000_000, 10_100_000).arrayBuffer();
const bridgeDownload = await fetch(
"https://huggingface.co/celinah/xet-experiments/resolve/main/model5GB.safetensors",
{
headers: {
Range: "bytes=10000000-10099999",
},
}
).then((res) => res.arrayBuffer());
console.log("xet", xetDownload.byteLength, "bridge", bridgeDownload.byteLength);
expect(new Uint8Array(xetDownload).length).toEqual(100_000);
expect(new Uint8Array(xetDownload)).toEqual(new Uint8Array(bridgeDownload));
});
it("should load text correctly when offset_into_range starts in a chunk further than the first", async () => {
const blob = new XetBlob({
refreshUrl: "https://huggingface.co/api/models/celinah/xet-experiments/xet-read-token/main",
hash: "794efea76d8cb372bbe1385d9e51c3384555f3281e629903ecb6abeff7d54eec",
size: 62_914_580,
});
// Reconstruction info
// {
// "offset_into_first_range": 600000,
// "terms":
// [
// {
// "hash": "be748f77930d5929cabd510a15f2c30f2f460b639804ef79dea46affa04fd8b2",
// "unpacked_length": 655360,
// "range": { "start": 0, "end": 5 },
// },
// {
// "hash": "be748f77930d5929cabd510a15f2c30f2f460b639804ef79dea46affa04fd8b2",
// "unpacked_length": 655360,
// "range": { "start": 0, "end": 5 },
// },
// ],
// "fetch_info":
// {
// "be748f77930d5929cabd510a15f2c30f2f460b639804ef79dea46affa04fd8b2":
// [
// {
// "range": { "start": 0, "end": 5 },
// "url": "...",
// "url_range": { "start": 0, "end": 2839 },
// },
// ],
// },
// }
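// The slice starts at 600_000, which falls inside the first term (unpacked_length 655_360)
// but several chunks past its start, exercising the skip logic within a chunk range.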
const text = await blob.slice(600_000, 700_000).text();
const bridgeDownload = await fetch("https://huggingface.co/celinah/xet-experiments/resolve/main/large_text.txt", {
headers: {
Range: "bytes=600000-699999",
},
}).then((res) => res.text());
console.log("xet", text.length, "bridge", bridgeDownload.length);
expect(text.length).toBe(bridgeDownload.length);
});
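// bg4_regoup_bytes undoes BG4 byte grouping: the grouped input stores the bytes destined for
// output positions 0,4,8,… first, then those for 1,5,9,…, then 2,6,10,…, then 3,7,11,…,
// and the function restores the original interleaved order (see the vectors below).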
describe("bg4_regoup_bytes", () => {
it("should regroup bytes when the array is %4 length", () => {
expect(bg4_regoup_bytes(new Uint8Array([1, 5, 2, 6, 3, 7, 4, 8]))).toEqual(
new Uint8Array([1, 2, 3, 4, 5, 6, 7, 8])
);
});
it("should regroup bytes when the array is %4 + 1 length", () => {
expect(bg4_regoup_bytes(new Uint8Array([1, 5, 9, 2, 6, 3, 7, 4, 8]))).toEqual(
new Uint8Array([1, 2, 3, 4, 5, 6, 7, 8, 9])
);
});
it("should regroup bytes when the array is %4 + 2 length", () => {
expect(bg4_regoup_bytes(new Uint8Array([1, 5, 9, 2, 6, 10, 3, 7, 4, 8]))).toEqual(
new Uint8Array([1, 2, 3, 4, 5, 6, 7, 8, 9, 10])
);
});
it("should regroup bytes when the array is %4 + 3 length", () => {
expect(bg4_regoup_bytes(new Uint8Array([1, 5, 9, 2, 6, 10, 3, 7, 11, 4, 8]))).toEqual(
new Uint8Array([1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11])
);
});
});
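// The tests below stub out the network entirely. The fake fetch handles the three round-trips
// XetBlob performs:
// - huggingface.co (refreshUrl) returns the CAS access token,
// - cas.co returns the reconstruction info (terms + fetch_info),
// - fetch.co streams the raw xorb bytes built with makeChunk below.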
describe("when mocked", () => {
describe("loading many chunks every read", () => {
it("should load different slices", async () => {
const chunk1Content = "hello";
const chunk2Content = "world!";
const debugged: Array<{ event: "read" | string } & Record<string, unknown>> = [];
const chunks = Array(1000)
.fill(0)
.flatMap(() => [makeChunk(chunk1Content), makeChunk(chunk2Content)]);
const mergedChunks = await new Blob(chunks).arrayBuffer();
const wholeText = (chunk1Content + chunk2Content).repeat(1000);
const totalSize = wholeText.length;
let fetchCount = 0;
const blob = new XetBlob({
hash: "test",
size: totalSize,
refreshUrl: "https://huggingface.co",
listener: (e) => debugged.push(e),
fetch: async function (_url, opts) {
const url = new URL(_url as string);
const headers = opts?.headers as Record<string, string> | undefined;
switch (url.hostname) {
case "huggingface.co": {
// This is a token
return new Response(
JSON.stringify({
casUrl: "https://cas.co",
accessToken: "boo",
exp: 1_000_000,
})
);
}
case "cas.co": {
// This is the reconstruction info
const range = headers?.["Range"]?.slice("bytes=".length).split("-").map(Number);
const start = range?.[0] ?? 0;
// const end = range?.[1] ?? (totalSize - 1);
return new Response(
JSON.stringify({
terms: Array(1000)
.fill(0)
.map(() => ({
hash: "test",
range: {
start: 0,
end: 2,
},
unpacked_length: chunk1Content.length + chunk2Content.length,
})),
fetch_info: {
test: [
{
url: "https://fetch.co",
range: { start: 0, end: 2 },
url_range: {
start: 0,
end: mergedChunks.byteLength / 1000 - 1,
},
},
],
},
offset_into_first_range: start,
} satisfies ReconstructionInfo)
);
}
case "fetch.co": {
fetchCount++;
return new Response(
new ReadableStream({
pull(controller) {
controller.enqueue(new Uint8Array(mergedChunks));
controller.close();
},
})
//mergedChunks
);
}
default:
throw new Error("Unhandled URL");
}
},
});
const startIndexes = [0, 5, 11, 6, 12, 100, 2000, totalSize - 12, totalSize - 2];
for (const index of startIndexes) {
console.log("slice", index);
const content = await blob.slice(index).text();
expect(content.length).toBe(wholeText.length - index);
expect(content.slice(0, 1000)).toEqual(wholeText.slice(index).slice(0, 1000));
expect(debugged.filter((e) => e.event === "read").length).toBe(2); // 1 read with data + 1 final read signalling done
expect(fetchCount).toEqual(1);
fetchCount = 0;
debugged.length = 0;
}
});
it("should load different slices when working with different XORBS", async () => {
const chunk1Content = "hello";
const chunk2Content = "world!";
const debugged: Array<{ event: "read" | string } & Record<string, unknown>> = [];
const chunks = Array(1000)
.fill(0)
.flatMap(() => [makeChunk(chunk1Content), makeChunk(chunk2Content)]);
const mergedChunks = await new Blob(chunks).arrayBuffer();
const wholeText = (chunk1Content + chunk2Content).repeat(1000);
const totalSize = wholeText.length;
let fetchCount = 0;
const blob = new XetBlob({
hash: "test",
size: totalSize,
refreshUrl: "https://huggingface.co",
listener: (e) => debugged.push(e),
fetch: async function (_url, opts) {
const url = new URL(_url as string);
const headers = opts?.headers as Record<string, string> | undefined;
switch (url.hostname) {
case "huggingface.co": {
// This is a token
return new Response(
JSON.stringify({
casUrl: "https://cas.co",
accessToken: "boo",
exp: 1_000_000,
})
);
}
case "cas.co": {
// This is the reconstruction info
const range = headers?.["Range"]?.slice("bytes=".length).split("-").map(Number);
const start = range?.[0] ?? 0;
// const end = range?.[1] ?? (totalSize - 1);
return new Response(
JSON.stringify({
terms: Array(1000)
.fill(0)
.map((_, i) => ({
hash: "test" + (i % 2),
range: {
start: 0,
end: 2,
},
unpacked_length: chunk1Content.length + chunk2Content.length,
})),
fetch_info: {
test0: [
{
url: "https://fetch.co",
range: { start: 0, end: 2 },
url_range: {
start: 0,
end: mergedChunks.byteLength - 1,
},
},
],
test1: [
{
url: "https://fetch.co",
range: { start: 0, end: 2 },
url_range: {
start: 0,
end: mergedChunks.byteLength - 1,
},
},
],
},
offset_into_first_range: start,
} satisfies ReconstructionInfo)
);
}
case "fetch.co": {
fetchCount++;
return new Response(
new ReadableStream({
pull(controller) {
controller.enqueue(new Uint8Array(mergedChunks));
controller.close();
},
})
//mergedChunks
);
}
default:
throw new Error("Unhandled URL");
}
},
});
const startIndexes = [0, 5, 11, 6, 12, 100, 2000, totalSize - 12, totalSize - 2];
for (const index of startIndexes) {
console.log("slice", index);
const content = await blob.slice(index).text();
expect(content.length).toBe(wholeText.length - index);
expect(content.slice(0, 1000)).toEqual(wholeText.slice(index).slice(0, 1000));
expect(debugged.filter((e) => e.event === "read").length).toBe(4); // 2 reads with data + 2 final reads, one pair per xorb fetch
expect(fetchCount).toEqual(2);
fetchCount = 0;
debugged.length = 0;
}
});
});
describe("loading one chunk at a time", () => {
it("should load different slices but not till the end", async () => {
const chunk1Content = "hello";
const chunk2Content = "world!";
const debugged: Array<{ event: "read" | string } & Record<string, unknown>> = [];
const chunks = Array(1000)
.fill(0)
.flatMap(() => [makeChunk(chunk1Content), makeChunk(chunk2Content)]);
const totalChunkLength = sum(chunks.map((x) => x.byteLength));
const wholeText = (chunk1Content + chunk2Content).repeat(1000);
const totalSize = wholeText.length;
let fetchCount = 0;
const blob = new XetBlob({
hash: "test",
size: totalSize,
refreshUrl: "https://huggingface.co",
listener: (e) => debugged.push(e),
fetch: async function (_url, opts) {
const url = new URL(_url as string);
const headers = opts?.headers as Record<string, string> | undefined;
switch (url.hostname) {
case "huggingface.co": {
// This is a token
return new Response(
JSON.stringify({
casUrl: "https://cas.co",
accessToken: "boo",
exp: 1_000_000,
})
);
}
case "cas.co": {
// This is the reconstruction info
const range = headers?.["Range"]?.slice("bytes=".length).split("-").map(Number);
const start = range?.[0] ?? 0;
// const end = range?.[1] ?? (totalSize - 1);
return new Response(
JSON.stringify({
terms: [
{
hash: "test",
range: {
start: 0,
end: 2000,
},
unpacked_length: chunk1Content.length + chunk2Content.length,
},
],
fetch_info: {
test: [
{
url: "https://fetch.co",
range: { start: 0, end: 2000 },
url_range: {
start: 0,
end: totalChunkLength - 1,
},
},
],
},
offset_into_first_range: start,
} satisfies ReconstructionInfo)
);
}
case "fetch.co": {
fetchCount++;
return new Response(
new ReadableStream({
pull(controller) {
for (const chunk of chunks) {
controller.enqueue(chunk);
}
controller.close();
},
}),
{
headers: {
"Content-Range": `bytes 0-${totalChunkLength - 1}/${totalChunkLength}`,
ETag: `"test"`,
"Content-Length": `${totalChunkLength}`,
},
}
);
}
default:
throw new Error("Unhandled URL");
}
},
});
const startIndexes = [0, 5, 11, 6, 12, 100, 2000];
for (const index of startIndexes) {
console.log("slice", index);
const content = await blob.slice(index, 4000).text();
expect(content.length).toBe(4000 - index);
expect(content.slice(0, 1000)).toEqual(wholeText.slice(index).slice(0, 1000));
expect(fetchCount).toEqual(1);
fetchCount = 0;
debugged.length = 0;
}
});
it("should load different slices", async () => {
const chunk1Content = "hello";
const chunk2Content = "world!";
const debugged: Array<{ event: "read" | string } & Record<string, unknown>> = [];
const chunks = Array(1000)
.fill(0)
.flatMap(() => [makeChunk(chunk1Content), makeChunk(chunk2Content)]);
const totalChunkLength = sum(chunks.map((x) => x.byteLength));
const wholeText = (chunk1Content + chunk2Content).repeat(1000);
const totalSize = wholeText.length;
let fetchCount = 0;
const blob = new XetBlob({
hash: "test",
size: totalSize,
refreshUrl: "https://huggingface.co",
listener: (e) => debugged.push(e),
fetch: async function (_url, opts) {
const url = new URL(_url as string);
const headers = opts?.headers as Record<string, string> | undefined;
switch (url.hostname) {
case "huggingface.co": {
// This is a token
return new Response(
JSON.stringify({
casUrl: "https://cas.co",
accessToken: "boo",
exp: 1_000_000,
})
);
}
case "cas.co": {
// This is the reconstruction info
const range = headers?.["Range"]?.slice("bytes=".length).split("-").map(Number);
const start = range?.[0] ?? 0;
// const end = range?.[1] ?? (totalSize - 1);
return new Response(
JSON.stringify({
terms: Array(1000)
.fill(0)
.map(() => ({
hash: "test",
range: {
start: 0,
end: 2,
},
unpacked_length: chunk1Content.length + chunk2Content.length,
})),
fetch_info: {
test: [
{
url: "https://fetch.co",
range: { start: 0, end: 2 },
url_range: {
start: 0,
end: totalChunkLength - 1,
},
},
],
},
offset_into_first_range: start,
} satisfies ReconstructionInfo)
);
}
case "fetch.co": {
fetchCount++;
return new Response(
new ReadableStream({
pull(controller) {
for (const chunk of chunks) {
controller.enqueue(chunk);
}
controller.close();
},
})
);
}
default:
throw new Error("Unhandled URL");
}
},
});
const startIndexes = [0, 5, 11, 6, 12, 100, 2000, totalSize - 12, totalSize - 2];
for (const index of startIndexes) {
console.log("slice", index);
const content = await blob.slice(index).text();
expect(content.length).toBe(wholeText.length - index);
expect(content.slice(0, 1000)).toEqual(wholeText.slice(index).slice(0, 1000));
expect(debugged.filter((e) => e.event === "read").length).toBe(2000 + 1); // 1 read for each chunk + 1 undefined
expect(fetchCount).toEqual(1);
fetchCount = 0;
debugged.length = 0;
}
});
});
describe("loading at 29 bytes intervals", () => {
it("should load different slices", async () => {
const chunk1Content = "hello";
const chunk2Content = "world!";
const debugged: Array<{ event: "read" | string } & Record<string, unknown>> = [];
const chunks = Array(1000)
.fill(0)
.flatMap(() => [makeChunk(chunk1Content), makeChunk(chunk2Content)]);
const mergedChunks = await new Blob(chunks).arrayBuffer();
const splitChunks = splitChunk(new Uint8Array(mergedChunks), 29);
const totalChunkLength = sum(chunks.map((x) => x.byteLength));
const wholeText = (chunk1Content + chunk2Content).repeat(1000);
const totalSize = wholeText.length;
let fetchCount = 0;
const blob = new XetBlob({
hash: "test",
size: totalSize,
refreshUrl: "https://huggingface.co",
listener: (e) => debugged.push(e),
fetch: async function (_url, opts) {
const url = new URL(_url as string);
const headers = opts?.headers as Record<string, string> | undefined;
switch (url.hostname) {
case "huggingface.co": {
// This is a token
return new Response(
JSON.stringify({
casUrl: "https://cas.co",
accessToken: "boo",
exp: 1_000_000,
})
);
}
case "cas.co": {
// This is the reconstruction info
const range = headers?.["Range"]?.slice("bytes=".length).split("-").map(Number);
const start = range?.[0] ?? 0;
// const end = range?.[1] ?? (totalSize - 1);
return new Response(
JSON.stringify({
terms: Array(1000)
.fill(0)
.map(() => ({
hash: "test",
range: {
start: 0,
end: 2,
},
unpacked_length: chunk1Content.length + chunk2Content.length,
})),
fetch_info: {
test: [
{
url: "https://fetch.co",
range: { start: 0, end: 2 },
url_range: {
start: 0,
end: totalChunkLength - 1,
},
},
],
},
offset_into_first_range: start,
} satisfies ReconstructionInfo)
);
}
case "fetch.co": {
fetchCount++;
return new Response(
new ReadableStream({
pull(controller) {
for (const chunk of splitChunks) {
controller.enqueue(chunk);
}
controller.close();
},
})
);
}
default:
throw new Error("Unhandled URL");
}
},
});
const startIndexes = [0, 5, 11, 6, 12, 100, 2000, totalSize - 12, totalSize - 2];
for (const index of startIndexes) {
console.log("slice", index);
const content = await blob.slice(index).text();
expect(content.length).toBe(wholeText.length - index);
expect(content.slice(0, 1000)).toEqual(wholeText.slice(index).slice(0, 1000));
expect(debugged.filter((e) => e.event === "read").length).toBe(Math.ceil(totalChunkLength / 29) + 1); // 1 read per 29-byte network piece + 1 final read
expect(fetchCount).toEqual(1);
fetchCount = 0;
debugged.length = 0;
}
});
});
describe("loading one byte at a time", () => {
it("should load different slices", async () => {
const chunk1Content = "hello";
const chunk2Content = "world!";
const debugged: Array<{ event: "read" | string } & Record<string, unknown>> = [];
const chunks = Array(100)
.fill(0)
.flatMap(() => [makeChunk(chunk1Content), makeChunk(chunk2Content)])
.flatMap((x) => splitChunk(x, 1));
const totalChunkLength = sum(chunks.map((x) => x.byteLength));
const wholeText = (chunk1Content + chunk2Content).repeat(100);
const totalSize = wholeText.length;
let fetchCount = 0;
const blob = new XetBlob({
hash: "test",
size: totalSize,
refreshUrl: "https://huggingface.co",
listener: (e) => debugged.push(e),
fetch: async function (_url, opts) {
const url = new URL(_url as string);
const headers = opts?.headers as Record<string, string> | undefined;
switch (url.hostname) {
case "huggingface.co": {
// This is a token
return new Response(
JSON.stringify({
casUrl: "https://cas.co",
accessToken: "boo",
exp: 1_000_000,
})
);
}
case "cas.co": {
// This is the reconstruction info
const range = headers?.["Range"]?.slice("bytes=".length).split("-").map(Number);
const start = range?.[0] ?? 0;
// const end = range?.[1] ?? (totalSize - 1);
return new Response(
JSON.stringify({
terms: Array(100)
.fill(0)
.map(() => ({
hash: "test",
range: {
start: 0,
end: 2,
},
unpacked_length: chunk1Content.length + chunk2Content.length,
})),
fetch_info: {
test: [
{
url: "https://fetch.co",
range: { start: 0, end: 2 },
url_range: {
start: 0,
end: totalChunkLength - 1,
},
},
],
},
offset_into_first_range: start,
} satisfies ReconstructionInfo)
);
}
case "fetch.co": {
fetchCount++;
return new Response(
new ReadableStream({
pull(controller) {
for (const chunk of chunks) {
controller.enqueue(chunk);
}
controller.close();
},
})
);
}
default:
throw new Error("Unhandled URL");
}
},
});
const startIndexes = [0, 5, 11, 6, 12, 100, totalSize - 12, totalSize - 2];
for (const index of startIndexes) {
console.log("slice", index);
const content = await blob.slice(index).text();
expect(content.length).toBe(wholeText.length - index);
expect(content.slice(0, 1000)).toEqual(wholeText.slice(index).slice(0, 1000));
expect(debugged.filter((e) => e.event === "read").length).toBe(totalChunkLength + 1); // 1 read per byte delivered by the stream + 1 final read
expect(fetchCount).toEqual(1);
fetchCount = 0;
debugged.length = 0;
}
});
});
});
});
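// Builds a single xet chunk as served by the mock xorb endpoint: an 8-byte header
// (version, 24-bit little-endian compressed length, compression scheme 0 = uncompressed,
// 24-bit little-endian uncompressed length) followed by the raw payload.
// e.g. makeChunk("hi") => Uint8Array [0, 2, 0, 0, 0, 2, 0, 0, 0x68, 0x69]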
function makeChunk(content: string) {
const encoded = new TextEncoder().encode(content);
const array = new Uint8Array(encoded.length + 8);
const dataView = new DataView(array.buffer);
dataView.setUint8(0, 0); // version
dataView.setUint8(1, encoded.length % 256); // Compressed length
dataView.setUint8(2, (encoded.length >> 8) % 256); // Compressed length
dataView.setUint8(3, (encoded.length >> 16) % 256); // Compressed length
dataView.setUint8(4, 0); // Compression scheme
dataView.setUint8(5, encoded.length % 256); // Uncompressed length
dataView.setUint8(6, (encoded.length >> 8) % 256); // Uncompressed length
dataView.setUint8(7, (encoded.length >> 16) % 256); // Uncompressed length
array.set(encoded, 8);
return array;
}
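// Splits a byte array into consecutive pieces of at most `toLength` bytes, used to simulate
// a network stream delivering data in small reads.
// e.g. splitChunk(Uint8Array.of(1, 2, 3, 4, 5), 2) => [[1, 2], [3, 4], [5]]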
function splitChunk(chunk: Uint8Array, toLength: number): Uint8Array[] {
const dataView = new DataView(chunk.buffer);
return new Array(Math.ceil(chunk.byteLength / toLength)).fill(0).map((_, i) => {
const array = new Uint8Array(Math.min(toLength, chunk.byteLength - i * toLength));
for (let j = 0; j < array.byteLength; j++) {
array[j] = dataView.getUint8(i * toLength + j);
}
return array;
});
}