Benjamin Consolvo commited on
Commit
6128b93
1 Parent(s): 81fdd84

optimum intel

Browse files
Files changed (2) hide show
  1. app.py +10 -6
  2. requirements.txt +2 -1
app.py CHANGED
@@ -2,14 +2,18 @@ import gradio as gr
2
  from transformers import pipeline
3
  import time
4
 
5
- sparse_qa_pipeline = pipeline(task="question-answering",model="Intel/bert-base-uncased-squadv1.1-sparse-80-1x4-block-pruneofa")
 
 
 
 
 
 
6
  # sparse_qa_pipeline = pipeline(task="question-answering",model="Intel/distilbert-base-uncased-squadv1.1-sparse-80-1x4-block-pruneofa-int8")
7
 
8
- dense_qa_pipeline = pipeline(task="question-answering",model="csarron/bert-base-uncased-squad-v1")
9
- # dense_qa_pipeline = pipeline(task="question-answering",model="distilbert-base-uncased-distilled-squad")
10
 
11
- def greet(name):
12
- return "Hello " + name + "!!"
13
 
14
  def predict(context,question):
15
  '''
@@ -22,7 +26,7 @@ def predict(context,question):
22
  '''
23
 
24
  sparse_start_time = time.perf_counter()
25
- sparse_predictions = sparse_qa_pipeline(context=context,question=question)
26
  sparse_end_time = time.perf_counter()
27
  sparse_duration = (sparse_end_time - sparse_start_time) * 1000
28
  sparse_answer = sparse_predictions['answer']
 
2
  from transformers import pipeline
3
  import time
4
 
5
+ from optimum.intel.neural_compressor import IncQuantizedModelForQuestionAnswering
6
+
7
+ # model_id = "Intel/bert-base-uncased-squadv1.1-sparse-80-1x4-block-pruneofa"
8
+ model_id = "Intel/distilbert-base-uncased-squadv1.1-sparse-80-1x4-block-pruneofa-int8"
9
+ int8_model = IncQuantizedModelForQuestionAnswering.from_pretrained(model_id)
10
+
11
+ # sparse_qa_pipeline = pipeline(task="question-answering",model="Intel/bert-base-uncased-squadv1.1-sparse-80-1x4-block-pruneofa")
12
  # sparse_qa_pipeline = pipeline(task="question-answering",model="Intel/distilbert-base-uncased-squadv1.1-sparse-80-1x4-block-pruneofa-int8")
13
 
14
+ # dense_qa_pipeline = pipeline(task="question-answering",model="csarron/bert-base-uncased-squad-v1")
15
+ dense_qa_pipeline = pipeline(task="question-answering",model="distilbert-base-uncased-distilled-squad")
16
 
 
 
17
 
18
  def predict(context,question):
19
  '''
 
26
  '''
27
 
28
  sparse_start_time = time.perf_counter()
29
+ sparse_predictions = int8_model(context=context,question=question)
30
  sparse_end_time = time.perf_counter()
31
  sparse_duration = (sparse_end_time - sparse_start_time) * 1000
32
  sparse_answer = sparse_predictions['answer']
requirements.txt CHANGED
@@ -1,3 +1,4 @@
1
  transformers
2
  torch
3
- tensorflow
 
 
1
  transformers
2
  torch
3
+ tensorflow
4
+ optimum.intel