# bettertransformer-demo / defaults.py
# Felix Marty
# turn off aws instances
# 6e19ff8
# Default result record for a single request against the vanilla model.
# NOTE(review): presumably shown in place of a live response — confirm
# against the caller. Units are not stated in this file.
defaults_vanilla_single = {
    "status": 200,  # looks like an HTTP status code — confirm
    "prediction": "Positive",
    "inf_latency": 6.25,  # presumably milliseconds — TODO confirm
    "peak_gpu_memory": 2706.21,  # presumably MB — TODO confirm
    "end_to_end_latency": 81.95,  # presumably milliseconds — TODO confirm
}
# Default result record for a single request against the BetterTransformer
# ("bt") model; same keys as the vanilla single-request record.
# NOTE(review): presumably shown in place of a live response — confirm
# against the caller. Units are not stated in this file.
defaults_bt_single = {
    "status": 200,  # looks like an HTTP status code — confirm
    "prediction": "Positive",
    "inf_latency": 4.96,  # presumably milliseconds — TODO confirm
    "peak_gpu_memory": 2706.22,  # presumably MB — TODO confirm
    "end_to_end_latency": 78.69,  # presumably milliseconds — TODO confirm
}
# Default aggregate metrics for the "spam" scenario against the vanilla model.
# NOTE(review): "spam" presumably means a burst of many requests — confirm
# against the caller. Units are not stated in this file.
defaults_vanilla_spam = {
    "throughput": 184.58,  # presumably requests (or samples) per second — confirm
    "mean_inference_latency": 32.2,  # presumably milliseconds — TODO confirm
    "mean_peak_gpu_memory": 3046.26,  # presumably MB — TODO confirm
    "mean_padding_ratio": 69.53,  # presumably a percentage — TODO confirm
    "mean_sequence_length": 128.0,
    "effective_batch_size": 8.0,
}
# Default aggregate metrics for the "spam" scenario against the
# BetterTransformer ("bt") model; same keys as the vanilla spam record.
# NOTE(review): "spam" presumably means a burst of many requests — confirm
# against the caller. Units are not stated in this file.
defaults_bt_spam = {
    "throughput": 312.21,  # presumably requests (or samples) per second — confirm
    "mean_inference_latency": 14.42,  # presumably milliseconds — TODO confirm
    "mean_peak_gpu_memory": 2798.78,  # presumably MB — TODO confirm
    "mean_padding_ratio": 69.53,  # presumably a percentage — TODO confirm
    "mean_sequence_length": 128.0,
    "effective_batch_size": 8.0,
}
# Identifier of the model used by the demo.
MODEL_NAME = "distilbert-base-uncased-finetuned-sst-2-english"

# Batch size; marked as fixed by the original author, so do not change it here.
BATCH_SIZE = 8  # fixed!

# Request headers: payloads are declared as plain text.
HEADERS = {"Content-Type": "text/plain"}

# Prediction endpoints for the vanilla and BetterTransformer variants.
# NOTE(review): hard-coded public IP addresses — confirm these hosts are
# still reachable before relying on them.
ADDRESS_VANILLA = "http://3.83.142.46:8080/predictions/my_tc"
ADDRESS_BETTERTRANSFORMER = "http://3.95.136.2:8080/predictions/my_tc"