Nvidia-Embed-V1

Build error

Tonic committed on Jan 15, 2024

Commit

200153d

verified ·

1 Parent(s): b85ac58

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -50,16 +50,17 @@ def last_token_pool(last_hidden_states: Tensor, attention_mask: Tensor) -> Tenso
 @spaces.GPU
 def compute_embeddings(selected_task, input_text, system_prompt):
-    max_length = 2042  # Define max_length here
     if selected_task == "None":
-        # Use the system prompt if 'None' is selected
-        processed_texts = [f'Instruct: {system_prompt}\nQuery: {input_text}']
     else:
-        # Use the task description from the tasks dictionary
         task_description = tasks[selected_task]
         processed_texts = [f'Instruct: {task_description}\nQuery: {input_text}']
     batch_dict = tokenizer(processed_texts, max_length=max_length - 1, return_attention_mask=False, padding=False, truncation=True)
     batch_dict['input_ids'] = [input_ids + [tokenizer.eos_token_id] for input_ids in batch_dict['input_ids']]
     batch_dict = tokenizer.pad(batch_dict, padding=True, return_attention_mask=True, return_tensors='pt')

 @spaces.GPU
 def compute_embeddings(selected_task, input_text, system_prompt):
+    max_length = 2042
     if selected_task == "None":
+        if system_prompt:
+            processed_texts = [f'Instruct: {system_prompt}\nQuery: {input_text}']
+        else:
+            processed_texts = [f'Query: {input_text}']
     else:
         task_description = tasks[selected_task]
         processed_texts = [f'Instruct: {task_description}\nQuery: {input_text}']
     batch_dict = tokenizer(processed_texts, max_length=max_length - 1, return_attention_mask=False, padding=False, truncation=True)
     batch_dict['input_ids'] = [input_ids + [tokenizer.eos_token_id] for input_ids in batch_dict['input_ids']]
     batch_dict = tokenizer.pad(batch_dict, padding=True, return_attention_mask=True, return_tensors='pt')