Update index.js
index.js CHANGED
@@ -31,7 +31,7 @@ let currentQuery = '';
 
 async function initializeSessions() {
   status.textContent = 'Loading model...';
-
+
   ortSessionA = await ort.InferenceSession.create(
     await getModelFile(ONNX_MODEL, `onnx/QwenVL_A_${QUANT}.onnx`),
     { executionProviders: ["webgpu"] }
@@ -51,14 +51,14 @@ async function initializeSessions() {
     await getModelFile(ONNX_MODEL, `onnx/QwenVL_D_${QUANT}.onnx`),
     {
       executionProviders: ["webgpu"],
-    }
+    };
 
-
-
-
-
-
-
+  ortSessionE = await ort.InferenceSession.create(
+    await getModelFile(ONNX_MODEL, `onnx/QwenVL_E_${QUANT}.onnx`),
+    {
+      executionProviders: ["wasm"],
+    },
+  );
   );
 
 
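Note: each onnxruntime-web InferenceSession can pick its own execution provider, which is why the new QwenVL_E session runs on "wasm" while the other stages stay on "webgpu". A minimal sketch of that split, assuming an `ort` import from onnxruntime-web and placeholder model URLs:

```js
import * as ort from "onnxruntime-web";

// Hypothetical helper: fetch an .onnx file into a byte buffer.
async function fetchModel(url) {
  const res = await fetch(url);
  return new Uint8Array(await res.arrayBuffer());
}

// One session on the WebGPU backend, another on the wasm (CPU) backend.
const gpuSession = await ort.InferenceSession.create(
  await fetchModel("QwenVL_D.onnx"), // placeholder URL
  { executionProviders: ["webgpu"] },
);
const cpuSession = await ort.InferenceSession.create(
  await fetchModel("QwenVL_E.onnx"), // placeholder URL
  { executionProviders: ["wasm"] },
);
```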
@@ -126,11 +126,11 @@ export function float16ToInt64(float16Value) {
 
 
 async function handleQuery(imageUrl, query) {
-  console.log('handleQuery', {imageUrl}, {query});
-
+  console.log('handleQuery', { imageUrl }, { query });
+
   try {
     status.textContent = 'Analyzing...';
-
+
     const result = await imageTextToText(imageUrl, query, (out) => {
       output.textContent = out;
     });
@@ -160,9 +160,9 @@ export async function imageTextToText(
     "float16",
     new Uint16Array(
       config.num_hidden_layers *
-
-
-
+        config.num_key_value_heads *
+        MAX_SEQ_LENGTH *
+        (config.hidden_size / config.num_attention_heads)
     ).fill(0),
     [
       config.num_hidden_layers,
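The Uint16Array above backs a float16 key/value cache whose element count is num_hidden_layers × num_key_value_heads × MAX_SEQ_LENGTH × head_dim, with head_dim = hidden_size / num_attention_heads. A rough worked example of that arithmetic; the config values and MAX_SEQ_LENGTH below are assumptions (they roughly match Qwen2-VL-2B), not values read from this repo:

```js
// Assumed config values -- not read from this repo's config.json.
const config = {
  num_hidden_layers: 28,
  num_key_value_heads: 2,
  hidden_size: 1536,
  num_attention_heads: 12,
};
const MAX_SEQ_LENGTH = 1024; // hypothetical cap

const headDim = config.hidden_size / config.num_attention_heads; // 128
const elements =
  config.num_hidden_layers *
  config.num_key_value_heads *
  MAX_SEQ_LENGTH *
  headDim; // 28 * 2 * 1024 * 128 = 7,340,032 float16 values

// One Uint16 per float16 element, i.e. about 14 MB for this cache tensor.
console.log(elements, elements * 2);
```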
@@ -181,7 +181,7 @@ export async function imageTextToText(
   );
 
   let pos_factor = new Tensor("float16", new Uint16Array([0]), [1]);
-
+
   const tokenizer = await AutoTokenizer.from_pretrained(BASE_MODEL);
   const prompt = `\n<|im_start|>user\n<|vision_start|><|vision_end|>${query}<|im_end|>\n<|im_start|>assistant\n`;
   const token = await tokenizer(prompt, {
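The prompt string follows the Qwen chat template, with <|vision_start|>/<|vision_end|> marking where the image embeddings get spliced in. A small sketch of the tokenization step with transformers.js; the package name, checkpoint id, and the return_tensor option are assumptions here, since BASE_MODEL and the tokenizer options are defined elsewhere in this file:

```js
// Package and checkpoint id are assumptions; BASE_MODEL is defined elsewhere in index.js.
import { AutoTokenizer } from "@huggingface/transformers";

const tokenizer = await AutoTokenizer.from_pretrained("Qwen/Qwen2-VL-2B-Instruct");

const query = "Describe this image.";
const prompt =
  `\n<|im_start|>user\n<|vision_start|><|vision_end|>${query}<|im_end|>\n` +
  `<|im_start|>assistant\n`;

// return_tensor: false asks for plain arrays instead of Tensor objects (assumed option).
const token = await tokenizer(prompt, { return_tensor: false });
console.log(token.input_ids.length, "prompt tokens");
```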
@@ -249,7 +249,7 @@ export async function imageTextToText(
 
   await ortSessionA.release();
   ortSessionA = null;
-
+
   ({ hidden_states, position_ids } = await ortSessionD.run({
     "hidden_states.1": hidden_states,
     image_embed,
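ortSessionA is released as soon as it is no longer needed because onnxruntime-web sessions keep their wasm/WebGPU buffers alive until release() is called; session.run() then takes a feeds object keyed by input names and resolves to outputs keyed by output names. A sketch of that pattern, where the input/output names are placeholders rather than this model's real ones:

```js
// Run one stage: feeds map input names to ort.Tensor values (names are placeholders).
async function runStage(session, hiddenStates, imageEmbed) {
  const results = await session.run({
    "hidden_states.1": hiddenStates,
    image_embed: imageEmbed,
  });
  // Outputs come back keyed by output name.
  const { hidden_states, position_ids } = results;
  return { hidden_states, position_ids };
}

// Free a session's native/GPU resources once it is no longer needed.
async function dispose(session) {
  await session.release();
}
```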
@@ -333,7 +333,7 @@ export async function imageTextToText(
       } else {
         const decoded = tokenizer.decode([...token_id.data]);
         cb(output);
-
+
         output += decoded;
       }
     }
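The cb(output) call is what streams partial text to the UI: each generated token id is decoded and appended to the running output, and the callback receives everything produced so far. A toy sketch of that accumulation loop; decodeIds stands in for tokenizer.decode and is purely illustrative:

```js
// Incremental decode with a progress callback (illustrative only).
function streamTokens(tokenIds, decodeIds, cb) {
  let output = "";
  for (const id of tokenIds) {
    const decoded = decodeIds([id]);
    cb(output);        // report the text generated so far
    output += decoded; // then append the newly decoded piece
  }
  return output;
}

// Usage with a toy "decoder".
const text = streamTokens(
  [1, 2, 3],
  (ids) => ids.map((i) => `tok${i} `).join(""),
  (partial) => console.log("partial:", partial),
);
console.log("final:", text);
```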
@@ -378,7 +378,7 @@ promptInput.addEventListener('keypress', (e) => {
 
 form.addEventListener('submit', (e) => {
   e.preventDefault();
-
+
   if (!currentImage || !currentQuery) {
     status.textContent = 'Please select an image and type a prompt';
   } else {