bettertransformer-demo / defaults.py
Felix Marty
hopefully stable
7d58e23
raw
history blame
1.05 kB
# Placeholder result for a single request against the vanilla (non-BetterTransformer)
# endpoint. NOTE(review): presumably shown before any live request has completed, and
# latencies look like milliseconds / memory like MB -- confirm against the caller.
defaults_vanilla_single = {
    "status": 200,  # presumably the HTTP status code of the response
    "prediction": "Positive",
    "inf_latency": 7.66,
    "peak_gpu_memory": 2706.21,
    "end_to_end_latency": 309.65,
}
# Placeholder result for a single request against the BetterTransformer endpoint.
# Carries the same keys as the vanilla single-request defaults so the two can be
# displayed side by side. NOTE(review): units are not stated in this file -- confirm.
defaults_bt_single = {
    "status": 200,  # presumably the HTTP status code of the response
    "prediction": "Positive",
    "inf_latency": 6.01,
    "peak_gpu_memory": 2706.22,
    "end_to_end_latency": 303.53,
}
# Placeholder aggregate metrics for the "spam" (many requests) scenario against the
# vanilla endpoint. NOTE(review): the "mean_*" values are presumably averages over the
# burst of requests, and the padding ratio looks like a percentage -- confirm.
defaults_vanilla_spam = {
    "throughput": 28.04,
    "mean_inference_latency": 24.43,
    "mean_peak_gpu_memory": 2907.92,
    "mean_padding_ratio": 69.53,
    "mean_sequence_length": 128.0,
    "effective_batch_size": 4.3,
}
# Placeholder aggregate metrics for the "spam" (many requests) scenario against the
# BetterTransformer endpoint. Carries the same keys as the vanilla spam defaults.
# NOTE(review): units are not stated in this file -- confirm against the caller.
defaults_bt_spam = {
    "throughput": 38.53,
    "mean_inference_latency": 12.73,
    "mean_peak_gpu_memory": 2761.64,
    "mean_padding_ratio": 69.53,
    "mean_sequence_length": 128.0,
    "effective_batch_size": 4.7,
}
# --- Model / batching -------------------------------------------------------
MODEL_NAME = "distilbert-base-uncased-finetuned-sst-2-english"
BATCH_SIZE = 8  # fixed!

# --- Prediction endpoints ---------------------------------------------------
# Request headers: the payload is sent as plain text.
HEADERS = {"Content-Type": "text/plain"}

# NOTE(review): both endpoints are hard-coded public IPs over plain HTTP; the
# "/predictions/<model>" path on port 8080 looks like a TorchServe inference
# API -- confirm, and consider moving these to configuration.
ADDRESS_VANILLA = "http://3.83.142.46:8080/predictions/my_tc"
ADDRESS_BETTERTRANSFORMER = "http://3.95.136.2:8080/predictions/my_tc"