File size: 1,052 Bytes
35e3254
 
7d58e23
6e19ff8
7d58e23
6e19ff8
35e3254
 
 
 
7d58e23
6e19ff8
7d58e23
6e19ff8
35e3254
 
 
6e19ff8
 
 
7d58e23
 
6e19ff8
35e3254
 
 
6e19ff8
 
 
7d58e23
 
6e19ff8
35e3254
 
 
 
 
 
17ca086
7d58e23
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
# Preset values for the "vanilla" single-request result fields.
# NOTE(review): units are not stated in this file (latencies look like
# milliseconds, memory like MB) — confirm against the consumer.
defaults_vanilla_single = dict(
    status=200,
    prediction="Positive",
    inf_latency=6.25,
    peak_gpu_memory=2706.21,
    end_to_end_latency=81.95,
)

# Preset values for the "bt" single-request result fields.
# NOTE(review): "bt" presumably stands for BetterTransformer (compare
# ADDRESS_BETTERTRANSFORMER); units are not stated here — confirm.
defaults_bt_single = dict(
    status=200,
    prediction="Positive",
    inf_latency=4.96,
    peak_gpu_memory=2706.22,
    end_to_end_latency=78.69,
)

# Preset aggregate metrics for the "vanilla" spam (many-request) case.
# NOTE(review): units and how the means are computed are not shown in
# this file — confirm against the code that produces these fields.
defaults_vanilla_spam = dict(
    throughput=184.58,
    mean_inference_latency=32.2,
    mean_peak_gpu_memory=3046.26,
    mean_padding_ratio=69.53,
    mean_sequence_length=128.0,
    effective_batch_size=8.0,
)

# Preset aggregate metrics for the "bt" spam (many-request) case.
# NOTE(review): "bt" presumably stands for BetterTransformer (compare
# ADDRESS_BETTERTRANSFORMER); units are not stated here — confirm.
defaults_bt_spam = dict(
    throughput=312.21,
    mean_inference_latency=14.42,
    mean_peak_gpu_memory=2798.78,
    mean_padding_ratio=69.53,
    mean_sequence_length=128.0,
    effective_batch_size=8.0,
)

# Model identifier string.
MODEL_NAME = "distilbert-base-uncased-finetuned-sst-2-english"

# Prediction endpoint URLs, one per model variant.
ADDRESS_VANILLA = "http://3.83.142.46:8080/predictions/my_tc"
ADDRESS_BETTERTRANSFORMER = "http://3.95.136.2:8080/predictions/my_tc"

# Header mapping declaring a plain-text content type.
HEADERS = dict([("Content-Type", "text/plain")])

# Fixed value: do not change.
BATCH_SIZE = 8