bettertransformer-demo / defaults.py
Felix Marty
update
bf38ec8
raw
history blame
1.04 kB
# Canned result for a single request against the vanilla endpoint.
# NOTE(review): presumably displayed by the demo before any real request has
# been made, and the numeric units are not stated here (latencies look like
# milliseconds, memory like MB) -- confirm against the caller.
defaults_vanilla_single = dict(
    status=200,
    prediction="Accepted",
    inf_latency=20.77,
    peak_gpu_memory=2717.36,
    end_to_end_latency=93.65,
)
# Canned result for a single request against the BetterTransformer endpoint.
# Same keys as the vanilla single-request defaults; the figures here are
# placeholders, not measurements taken from a live endpoint.
# NOTE(review): units are not stated in this file -- confirm against the caller.
defaults_bt_single = dict(
    status=200,
    prediction="Accepted",
    inf_latency=20.77,
    peak_gpu_memory=2717.36,
    end_to_end_latency=93.65,
)
# Canned aggregate statistics for the "spam" (many requests) scenario against
# the vanilla endpoint.
# NOTE(review): presumably shown until a real batch of requests has completed;
# units of the latency / memory / ratio figures are not stated -- confirm.
defaults_vanilla_spam = dict(
    throughput=20,
    mean_inference_latency=29.69,
    mean_peak_gpu_memory=3620.9,
    mean_padding_ratio=35.26,
    mean_sequence_length=39.395,
    effective_batch_size=8,
)
# Canned aggregate statistics for the "spam" (many requests) scenario against
# the BetterTransformer endpoint. Same keys as the vanilla spam defaults; the
# figures are placeholders, not measurements taken from a live endpoint.
# NOTE(review): units are not stated in this file -- confirm against the caller.
defaults_bt_spam = dict(
    throughput=20,
    mean_inference_latency=29.69,
    mean_peak_gpu_memory=3620.9,
    mean_padding_ratio=35.26,
    mean_sequence_length=39.395,
    effective_batch_size=8,
)
# Model identifier string (looks like a Hugging Face Hub model id).
MODEL_NAME = "distilbert-base-uncased-finetuned-sst-2-english"

# Prediction endpoints for the two deployments being compared. Both are
# hard-coded plain-HTTP URLs on port 8080 with the same /predictions/my_tc
# path, differing only in host.
# NOTE(review): the path shape resembles a TorchServe inference route --
# confirm; the hosts are raw IP addresses, so they break if the servers move.
ADDRESS_VANILLA = "http://3.83.142.46:8080/predictions/my_tc"
ADDRESS_BETTERTRANSFORMER = "http://3.95.136.2:8080/predictions/my_tc"

# Request headers: the payload is declared as plain text.
HEADERS = dict([("Content-Type", "text/plain")])

# Batch size; marked as fixed by the original author, so do not tune it here.
BATCH_SIZE = 8  # fixed!