Spaces:

pdufour
/

Qwen2-VL-2B-Instruct-ONNX-Q4-F16

Running

App Files Community

pdufour committed on Nov 19

Commit

44a6e1e

•

1 Parent(s): 104dfa1

Update index.js

Browse files

Files changed (1) hide show

index.js +1 -11

index.js CHANGED Viewed

@@ -19,7 +19,7 @@ const fileUpload = document.getElementById('upload');
 const imageContainer = document.getElementById('container');
 const example = document.getElementById('example');
-let ortSessionA, ortSessionB, ortSessionC;
 let config;
 async function initializeSessions() {
@@ -29,19 +29,16 @@ async function initializeSessions() {
     await getModelFile(ONNX_MODEL, `onnx/QwenVL_A_${QUANT}.onnx`),
     { executionProviders: ["webgpu"] }
   );
-  console.log({ortSessionA});
   ortSessionB = await ort.InferenceSession.create(
     await getModelFile(ONNX_MODEL, `onnx/QwenVL_B_${QUANT}.onnx`),
     { executionProviders: ["webgpu"] }
   );
-  console.log({ortSessionB});
   ortSessionC = await ort.InferenceSession.create(
     await getModelFile(ONNX_MODEL, `onnx/QwenVL_C_${QUANT}.onnx`),
     { executionProviders: ["webgpu"] }
   );
-  console.log({ortSessionC});
   config = (await getModelJSON(BASE_MODEL, "config.json"));
@@ -77,7 +74,6 @@ export async function imageTextToText(
   query,
   vision = true
 ) {
-  let ortSessionA, ortSessionB, ortSessionC, ortSessionD, ortSessionE;
   const prompt_head_len = new Tensor("int64", new BigInt64Array([5n]), [1]);
@@ -136,12 +132,6 @@ export async function imageTextToText(
   const dummy = new ort.Tensor("int32", new Int32Array([0]), []);
-  if (!ortSessionB) {
-    await ort.InferenceSession.create(
-      await getModelFile(ONNX_MODEL, `onnx/QwenVL_B_${QUANT}.onnx`),
-        { executionProviders: ["webgpu"] }
-    );
-  }
   let { hidden_states } = await ortSessionB.run({
     input_ids: input_ids,
     ids_len: ids_len,

 const imageContainer = document.getElementById('container');
 const example = document.getElementById('example');
+let ortSessionA, ortSessionB, ortSessionC, ortSessionD, ortSessionE;
 let config;
 async function initializeSessions() {
     await getModelFile(ONNX_MODEL, `onnx/QwenVL_A_${QUANT}.onnx`),
     { executionProviders: ["webgpu"] }
   );
   ortSessionB = await ort.InferenceSession.create(
     await getModelFile(ONNX_MODEL, `onnx/QwenVL_B_${QUANT}.onnx`),
     { executionProviders: ["webgpu"] }
   );
   ortSessionC = await ort.InferenceSession.create(
     await getModelFile(ONNX_MODEL, `onnx/QwenVL_C_${QUANT}.onnx`),
     { executionProviders: ["webgpu"] }
   );
   config = (await getModelJSON(BASE_MODEL, "config.json"));
   query,
   vision = true
 ) {
   const prompt_head_len = new Tensor("int64", new BigInt64Array([5n]), [1]);
   const dummy = new ort.Tensor("int32", new Int32Array([0]), []);
   let { hidden_states } = await ortSessionB.run({
     input_ids: input_ids,
     ids_len: ids_len,