ABCDEFGHIJKLMNOPQRSTUVWXYZAA
1
filenum_requestsdurationqpsslowestfastestaveragelat(.10)lat(.25)lat(.50)lat(.75)lat(.90)lat(.95)lat(.99)time for first requesttime to reach steady stategit
2
3
Distillbert
4
2 CORES warm verta/distilbert/1/output-amd.csv53954011.4540.75260.80440.77380.77840.79780.79780.79780.79780.7978
5
2 CORES warm verta/distilbert/1/output-amd.csv (second try)54053911.10070.75960.80510.77310.77820.79440.79440.79440.79440.7944
6
2 CORES warm verta/distilbert/1/output-amd.csv (MKL_DEBUG_CPU_TYPE=5)
54154010.47040.27470.28830.27790.28070.28590.28590.28590.28590.2859
7
warm verta/distilbert/1/output-intel.csv54053910.30430.25310.26350.25590.25750.26050.26640.27660.28090.2935
8
cold verta/distilbert/100.7s315s
9
cold verta/distilbert/100, overprovisioned nodes105s
10
warm verta/distilbert/100/output.csv5395354099.911.40510.11840.38120.19540.24190.37210.42170.59830.66130.803
11
warm verta/distilbert/100/output-2cores.csv 2 CPU53983539100.150.84030.12010.25860.16350.17720.21530.3190.41170.45940.574
12
13
warm : lambda/distilbert/1/output.csv54053910.60090.4650.49410.47340.48140.48850.50150.51990.53410.5738link
14
cold: lambda/distilbert-2/100/output.csv55928559100.0512.95020.43950.48520.46530.47040.47860.49090.5080.52530.593841.013879link
Tweakable in Verta
15
16
knative/results/warm_cloudrun_distilbert_1cpu_1qps.csv29929912.45960.3740.41610.37990.38550.39370.40560.45460.46780.4878
17
knative/results/warm_cloudrun_distilbert_1cpu_1qps.csv (cut)27127010.49330.38570.41670.39890.40510.41650.41650.41650.41650.4165
18
knative/results/warm_cloudrun_distilbert_2cpu_1qps.csv (cut)
54154010.58260.36670.39830.37250.37650.38480.4160.44010.45740.4971
19
knative/results/cold_cloudrun_distilbert_1cpu_100qps.csv4796959980.0819.55530.36790.77250.40870.44320.5290.63660.70680.78839.749610.829834*
20
knative/results/cold_cloudrun_distilbert_1cpu_envvars_100qps.csv48136598.9780.3618.58450.35520.8260.4120.44730.5340.65770.7120.77619.33437.836*
21
knative/results/cold_cloudrun_distilbert_2cpu_100qps.csv5108359985.2818.24940.35310.68810.39380.42130.47820.55590.62050.65369.24331452*
22
knative/results/cold_cloudrun_distilbert_2cpu_envvars_100qps.csv
5060759984.4918.71040.36180.72740.40050.43250.50750.61730.66970.70538.73768.233*
23
knative/results/warm_cloudrun_distilbert_1cpu_100qps.csv (cut)4571653984.8219.1260.36070.76010.41640.46810.57370.66020.7110.74959.027
24
knative/results/warm_cloudrun_distilbert_1cpu_envvars_100qps.csv (cut)
4459153982.7319.97680.36840.80760.420.47710.6290.68210.7230.76038.5836
25
knative/results/warm_cloudrun_distilbert_2cpu_100qps.csv (cut)4554254383.8717.79250.36530.74790.40950.44950.55130.64850.70640.74348.9639
26
knative/results/warm_cloudrun_distilbert_2cpu_envvars_100qps.csv (cut)
4535554782.9219.6590.36580.76650.44230.52760.62010.66840.72880.8899.0606
27
28
29
30
Bert
31
warm verta/bert/1/output-amd.csv444539.240.821.75391.16311.21721.17641.18231.21181.21181.21181.21181.2118
32
warm verta/bert/1/output-intel.csv54154010.81790.32650.38750.33540.36080.37480.40210.43770.48870.5416
33
2 CORES warm verta/bert/1/output-intel.csv54154011.07650.31630.39760.33070.360.37930.42780.48020.50320.5991
34
warm verta/bert/100/output.csv5399254099.992.67410.23790.66220.36270.48530.65220.74910.97631.11611.3553
35
warm verta/bert/100/output-2cores.csv 2 CPU53923539100.041.94410.21340.59690.3490.49770.56250.6780.87050.93761.2219
36
37
warm : lambda/bert/1/output.csv54053911.27890.88920.92350.90320.90780.91840.92890.94450.96471.058link
- add more cpu
38
cold: lambda/bert-2/100/output.csv55925558.91100.064.21870.84340.93660.90780.9170.92930.94550.96630.98781.073541.101874link
- number of parallel requests
39
40
41
42
knative/results/warm_cloudrun_bert_2cpu_envvars_1qps.csv (cut)
54154011.09990.70730.73730.72220.72790.73360.74240.75330.76160.7857
43
knative/results/warm_cloudrun_bert_1cpu_envvars_1qps.csv (cut)53153010.84370.71790.76160.73520.74350.76340.76340.76340.76340.7634
44
knative/results/cold_cloudrun_bert_2cpu_envvars_100qps.csv
4112559968.6619.96090.69061.36530.74710.77630.85541.05831.18511.278414.30915.832*
45
knative/results/warm_cloudrun_bert_1cpu_envvars_100qps.csv (cut)42940526.4281.5719.94510.69971.18450.78360.8380.95651.12811.22691.274212.2201
46
knative/results/warm_cloudrun_bert_1cpu_100qps.csv (cut)40578524.277.4119.99250.71661.21810.80660.89771.11451.24421.31441.371410.5467
47
knative/results/warm_cloudrun_bert_2cpu_envvars_100qps.csv (cut)42237534.4979.0219.99820.70691.23150.79460.93981.1571.25751.33561.42910.1936
48
knative/results/warm_cloudrun_bert_2cpu_100qps.csv (cut)43326538.9180.419.82570.69851.21520.78650.88451.05281.17921.2551.297612.0589
49
knative/results/warm_cloudrun_bert_2cpu_envvars_100qps.csv (cut)
39491536.9673.5419.94930.69821.22810.78990.8580.98441.17561.36061.582112.3521
50
51
52
53
54
ResNet
55
warm verta/resnet/1/output.csv54154010.08590.0590.06160.06020.06060.06140.06220.06310.06430.0665
56
warm verta/resnet/100/steady-output.csv (first 80% removed)
902490.02100.240.44570.06120.15120.0880.1080.13840.18690.23510.25560.3207
57
warm verta/resnet/100/output-2cores.csv 2 CPU53979540.0299.960.70050.06270.12690.08240.09090.12010.15050.18560.20880.2524
58
59
warm lambda/resnet/cold_run_1qps.csv52652510.52070.19990.23060.210.21480.22390.23780.25640.27160.3564
60
cold lambda/resnet/cold_run_1qps.csv5835990.9718.68990.19990.26270.21030.21550.22430.23840.25730.27350.3603
61
warm lambda/resnet/cold_run_100qps.csv52634526.01100.061.30350.18720.22250.20220.2070.21450.2270.24670.270.3476
62
cold lambda/resnet/cold_run_100qps.csv58481599.0297.6317.75170.18720.25060.20230.20720.21470.22740.24750.27150.3553
63
64
knative/results/warm_cloudrun_resnet_1cpu_100qps.csv (cut)4597853386.2619.94330.13690.50490.25080.29920.34130.39220.43990.476611.0069
65
knative/results/warm_cloudrun_resnet_2cpu_envvars_1qps.csv (cut)
54154010.21360.13970.15730.14650.15070.15580.16230.16890.1730.1885
66
knative/results/warm_cloudrun_resnet_2cpu_envvars_100qps.csv (cut)
4462949789.819.86940.14210.47560.25350.30240.36270.41390.45940.49268.4587
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100