piotr-szleg-bards-ai committed on
Commit
8530cb4
1 Parent(s): 58bb3ba

2024-02-09 09:57:45 Publish script update

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. app.py +1 -1
  2. data/2024-01-17 12:38:58.304815_summary.csv +0 -28
  3. data/2024-01-17 12:39:37.086623_time_of_day_comparison.csv +0 -12
  4. data/2024-01-18 10:30:01.312286_time_of_day_comparison.csv +0 -12
  5. data/2024-01-22 12:13:19.498935_general_plot.csv +0 -327
  6. data/2024-01-22 12:14:03.377435_general_plot.csv +0 -0
  7. data/2024-01-22 12:15:16.239311chunk_plots.csv +0 -0
  8. data/2024-01-22 12:23:47.756798_general_plot.csv +0 -327
  9. data/{2024-01-25 06:47:26.520416_general_plot.csv → 2024-01-25 12:22:00.759762_general_plot.csv} +140 -83
  10. data/2024-01-25 13:30:17.207984_summary.csv +59 -0
  11. data/2024-01-25 13:30:20.959750_time_of_day_comparison.csv +20 -0
  12. data/2024-01-25 13:34:46.224347_summary.csv +59 -0
  13. data/2024-01-26 11:01:41.169428_general_plot.csv +398 -0
  14. data/2024-01-26 11:04:35.555342_general_plot.csv +398 -0
  15. data/2024-01-26 11:06:20.415218_general_plot.csv +398 -0
  16. data/2024-01-26 11:19:58.683853_general_plot.csv +398 -0
  17. data/2024-01-26 11:20:49.179382_general_plot.csv +398 -0
  18. data/2024-01-26 11:22:32.771167_general_plot.csv +398 -0
  19. data/2024-01-26 16:13:38.191636_model_costs.csv +13 -0
  20. data/2024-01-26 16:16:56.390177_model_costs.csv +13 -0
  21. data/2024-01-26 16:19:55.237955_model_costs.csv +13 -0
  22. data/2024-01-26 16:21:10.212177_model_costs.csv +13 -0
  23. data/2024-01-26 16:21:34.661653_model_costs.csv +13 -0
  24. data/2024-01-26 16:25:47.914140_model_costs.csv +13 -0
  25. data/2024-01-26 16:32:54.481637_model_costs.csv +13 -0
  26. data/2024-01-26 16:43:36.843194_general_plot.csv +398 -0
  27. data/2024-01-26 16:44:14.180186_general_plot.csv +398 -0
  28. data/2024-01-30 13:08:12.199559_general_plot.csv +398 -0
  29. data/2024-01-30 18:39:54.448407_time_of_day_comparison.csv +27 -0
  30. data/2024-01-30 18:40:08.467683_summary.csv +75 -0
  31. data/2024-02-01 08:08:06.822774_time_of_day_comparison.csv +34 -0
  32. data/2024-02-02 10:02:32.863904_time_of_day_comparison.csv +58 -0
  33. data/2024-02-02 10:13:06.642849_general_plot.csv +428 -0
  34. data/2024-02-02 11:10:33.807657_general_plot.csv +293 -0
  35. data/2024-02-03 21:01:06.672013_time_of_day_comparison.csv +58 -0
  36. data/2024-02-03 22:21:49.754184_time_of_day_comparison.csv +267 -0
  37. data/2024-02-03 22:30:15.856748_time_of_day_comparison.csv +91 -0
  38. data/2024-02-03 22:31:14.132394_time_of_day_comparison.csv +91 -0
  39. data/2024-02-03 22:33:36.957992_time_of_day_comparison.csv +91 -0
  40. data/2024-02-03 22:42:23.322179_summary.csv +75 -0
  41. data/2024-02-03 22:42:30.259126_general_plot.csv +428 -0
  42. data/2024-02-05 12:03:42.452218_general_plot.csv +442 -0
  43. data/2024-02-05 12:03:45.281624_model_costs.csv +12 -0
  44. data/2024-02-05 23:33:22.947120_summary.csv +55 -0
  45. data/2024-02-06 07:53:19.636658_time_of_day_comparison.csv +91 -0
  46. data/2024-02-06 09:35:10.194145_time_of_day_comparison.csv +89 -0
  47. data/2024-02-06 09:42:04.306128_time_of_day_comparison.csv +89 -0
  48. data/2024-02-06 09:46:18.795794_time_of_day_comparison.csv +89 -0
  49. data/2024-02-06 09:49:19.637072_time_of_day_comparison.csv +89 -0
  50. data/2024-02-06 13:25:55.133644_general_plot.csv +284 -0
app.py CHANGED
@@ -27,7 +27,7 @@ To do that we added following text to the query:
27
 
28
  {}
29
 
30
- All of the call were made from the same machine with the same internet connection with usage of the LiteLLM library which may adds some time overhead compared to pure curl calls.
31
 
32
  Please take a look at the following project and let us know if you have any questions or suggestions.
33
  """
 
27
 
28
  {}
29
 
30
+ All of the calls were made from the same machine with the same internet connection, using the LiteLLM library, which may add some time overhead compared to pure curl calls. Calls were made from Poland, UTC+1.
31
 
32
  Please take a look at the following project and let us know if you have any questions or suggestions.
33
  """
data/2024-01-17 12:38:58.304815_summary.csv DELETED
@@ -1,28 +0,0 @@
1
- model,language,template_name,execution_time,characters_count,words_count,chunk_sizes,chunk_generation_times,chunk_generation_times_by_chunk_sizes
2
- Mistral-7B-Instruct-v0.2,english,call,,,,,,
3
- Mistral-7B-Instruct-v0.2,english,json,3.6487972736358643,303.5,51.0,3.570588235294118,0.03324383567361271,0.001449326305389626
4
- Mistral-7B-Instruct-v0.2,english,markdown,4.151226162910461,358.0,60.0,3.58,0.03327744722366333,0.0006092002057602237
5
- Mistral-7B-Instruct-v0.2,japanese,call,,,,,,
6
- Mistral-7B-Instruct-v0.2,japanese,json,0.9473649263381958,0.0,0.0,,,
7
- Mistral-7B-Instruct-v0.2,japanese,markdown,0.8581207990646362,0.0,0.0,,,
8
- Mixtral-8x7B-Instruct-v0.1,english,json,2.337923765182495,305.5,48.5,3.636904761904762,0.009715833834239416,0.00017000696402891426
9
- TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,json,1.9294229745864868,334.0,55.5,3.5913978494623655,0.01203190895818895,0.0005004366755420837
10
- gemini-pro,english,json,,,,,,
11
- gpt-3.5-turbo,english,call,2.724249005317688,303.0,52.5,,,
12
- gpt-3.5-turbo,english,json,1.7111433148384094,282.25,48.5,4.342307692307692,0.017717334857353797,0.0006912943431051048
13
- gpt-3.5-turbo,english,markdown,2.6450350284576416,403.0,66.5,4.380434782608695,0.018466552962427555,0.0005482604451258303
14
- gpt-3.5-turbo,japanese,call,9.296517014503479,322.0,1.0,,,
15
- gpt-3.5-turbo,japanese,json,5.7430419921875,229.5,4.0,1.1167883211678833,0.02545691406639823,0.0004982973938963198
16
- gpt-3.5-turbo,japanese,markdown,8.998926281929016,369.5,1.0,1.098068350668648,0.024078829327451527,0.0006811250911499464
17
- llama-2-70b-chat,english,call,,,,,,
18
- llama-2-70b-chat,english,json,2.0344420671463013,292.0,43.5,3.4352941176470586,0.0120459423345678,0.0008612603182374274
19
- llama-2-70b-chat,english,markdown,3.0651516914367676,532.5,77.0,3.9444444444444446,0.013201815993697555,0.0003262027774235997
20
- llama-2-70b-chat,japanese,call,,,,,,
21
- llama-2-70b-chat,japanese,json,5.301165580749512,459.0,49.0,1.9827213822894167,0.015144962471453211,0.00037437952061093125
22
- llama-2-70b-chat,japanese,markdown,10.500205397605896,2586.5,395.5,4.664562669071235,0.016482780386027827,0.00010443909883635945
23
- zephyr-7b-beta,english,call,,,,,,
24
- zephyr-7b-beta,english,json,4.1515063643455505,357.5,60.0,3.8440860215053765,0.035762690087800385,0.0038104588643407896
25
- zephyr-7b-beta,english,markdown,4.133428335189819,348.0,62.0,3.625,0.0346326952179273,0.0010808045642794416
26
- zephyr-7b-beta,japanese,call,,,,,,
27
- zephyr-7b-beta,japanese,json,1.044502854347229,0.0,0.0,,,
28
- zephyr-7b-beta,japanese,markdown,0.8821841478347778,0.0,0.0,,,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
data/2024-01-17 12:39:37.086623_time_of_day_comparison.csv DELETED
@@ -1,12 +0,0 @@
1
- model,time_of_day,execution_time,characters_count,words_count
2
- Mistral-7B-Instruct-v0.2,morning,2.4013772904872894,165.375,27.75
3
- Mistral-7B-Instruct-v0.2,noon,,,
4
- Mixtral-8x7B-Instruct-v0.1,noon,2.337923765182495,305.5,48.5
5
- TinyLlama/TinyLlama-1.1B-Chat-v1.0,noon,1.9294229745864868,334.0,55.5
6
- gemini-pro,noon,,,
7
- gpt-3.5-turbo,morning,5.1754879752794904,316.3333333333333,28.25
8
- gpt-3.5-turbo,noon,5.12265948454539,338.6666666666667,32.666666666666664
9
- llama-2-70b-chat,morning,5.2554163336753845,967.5,141.25
10
- llama-2-70b-chat,noon,1.9137414693832397,292.0,43.5
11
- zephyr-7b-beta,morning,2.5529667139053345,176.375,30.5
12
- zephyr-7b-beta,noon,4.151261210441589,357.5,60.0
 
 
 
 
 
 
 
 
 
 
 
 
 
data/2024-01-18 10:30:01.312286_time_of_day_comparison.csv DELETED
@@ -1,12 +0,0 @@
1
- model,time_of_day,execution_time,characters_count,words_count
2
- Mistral-7B-Instruct-v0.2,morning,2.4013772904872894,165.375,27.75
3
- Mistral-7B-Instruct-v0.2,noon,2.43726247549057,165.375,27.75
4
- Mixtral-8x7B-Instruct-v0.1,noon,8.433558851480484,507.75,44.75
5
- TinyLlama/TinyLlama-1.1B-Chat-v1.0,noon,1.4488664865493774,162.0,27.625
6
- gemini-pro,noon,,,
7
- gpt-3.5-turbo,morning,5.1754879752794904,316.3333333333333,28.25
8
- gpt-3.5-turbo,noon,5.076187094052632,323.5833333333333,26.083333333333332
9
- llama-2-70b-chat,morning,5.2554163336753845,967.5,141.25
10
- llama-2-70b-chat,noon,5.080266445875168,967.5,141.25
11
- zephyr-7b-beta,morning,2.5529667139053345,176.375,30.5
12
- zephyr-7b-beta,noon,2.5973838567733765,176.25,30.375
 
 
 
 
 
 
 
 
 
 
 
 
 
data/2024-01-22 12:13:19.498935_general_plot.csv DELETED
@@ -1,327 +0,0 @@
1
- path,plot_object,description
2
- ./html/plots/response_times.html,"Figure({
3
- 'data': [{'alignmentgroup': 'True',
4
- 'hovertemplate': 'model=%{x}<br>execution_time=%{y}<extra></extra>',
5
- 'legendgroup': 'Mistral-7B-Instruct-v0.2',
6
- 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
7
- 'name': 'Mistral-7B-Instruct-v0.2',
8
- 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
9
- 'orientation': 'v',
10
- 'showlegend': True,
11
- 'textposition': 'auto',
12
- 'type': 'bar',
13
- 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
- 'xaxis': 'x',
15
- 'y': array([2.41931988]),
16
- 'yaxis': 'y'},
17
- {'alignmentgroup': 'True',
18
- 'hovertemplate': 'model=%{x}<br>execution_time=%{y}<extra></extra>',
19
- 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
20
- 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
21
- 'name': 'Mixtral-8x7B-Instruct-v0.1',
22
- 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
23
- 'orientation': 'v',
24
- 'showlegend': True,
25
- 'textposition': 'auto',
26
- 'type': 'bar',
27
- 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
- 'xaxis': 'x',
29
- 'y': array([8.43355885]),
30
- 'yaxis': 'y'},
31
- {'alignmentgroup': 'True',
32
- 'hovertemplate': 'model=%{x}<br>execution_time=%{y}<extra></extra>',
33
- 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
34
- 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
35
- 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
36
- 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
37
- 'orientation': 'v',
38
- 'showlegend': True,
39
- 'textposition': 'auto',
40
- 'type': 'bar',
41
- 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
- 'xaxis': 'x',
43
- 'y': array([1.44886649]),
44
- 'yaxis': 'y'},
45
- {'alignmentgroup': 'True',
46
- 'hovertemplate': 'model=%{x}<br>execution_time=%{y}<extra></extra>',
47
- 'legendgroup': 'gemini-pro',
48
- 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
- 'name': 'gemini-pro',
50
- 'offsetgroup': 'gemini-pro',
51
- 'orientation': 'v',
52
- 'showlegend': True,
53
- 'textposition': 'auto',
54
- 'type': 'bar',
55
- 'x': array(['gemini-pro'], dtype=object),
56
- 'xaxis': 'x',
57
- 'y': array([nan]),
58
- 'yaxis': 'y'},
59
- {'alignmentgroup': 'True',
60
- 'hovertemplate': 'model=%{x}<br>execution_time=%{y}<extra></extra>',
61
- 'legendgroup': 'gpt-3.5-turbo',
62
- 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
- 'name': 'gpt-3.5-turbo',
64
- 'offsetgroup': 'gpt-3.5-turbo',
65
- 'orientation': 'v',
66
- 'showlegend': True,
67
- 'textposition': 'auto',
68
- 'type': 'bar',
69
- 'x': array(['gpt-3.5-turbo'], dtype=object),
70
- 'xaxis': 'x',
71
- 'y': array([5.12583753]),
72
- 'yaxis': 'y'},
73
- {'alignmentgroup': 'True',
74
- 'hovertemplate': 'model=%{x}<br>execution_time=%{y}<extra></extra>',
75
- 'legendgroup': 'llama-2-70b-chat',
76
- 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
- 'name': 'llama-2-70b-chat',
78
- 'offsetgroup': 'llama-2-70b-chat',
79
- 'orientation': 'v',
80
- 'showlegend': True,
81
- 'textposition': 'auto',
82
- 'type': 'bar',
83
- 'x': array(['llama-2-70b-chat'], dtype=object),
84
- 'xaxis': 'x',
85
- 'y': array([5.16784139]),
86
- 'yaxis': 'y'},
87
- {'alignmentgroup': 'True',
88
- 'hovertemplate': 'model=%{x}<br>execution_time=%{y}<extra></extra>',
89
- 'legendgroup': 'zephyr-7b-beta',
90
- 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
- 'name': 'zephyr-7b-beta',
92
- 'offsetgroup': 'zephyr-7b-beta',
93
- 'orientation': 'v',
94
- 'showlegend': True,
95
- 'textposition': 'auto',
96
- 'type': 'bar',
97
- 'x': array(['zephyr-7b-beta'], dtype=object),
98
- 'xaxis': 'x',
99
- 'y': array([2.57517529]),
100
- 'yaxis': 'y'}],
101
- 'layout': {'barmode': 'relative',
102
- 'legend': {'title': {'text': 'model'}, 'tracegroupgap': 0},
103
- 'margin': {'t': 60},
104
- 'template': '...',
105
- 'xaxis': {'anchor': 'y',
106
- 'categoryarray': [Mistral-7B-Instruct-v0.2,
107
- Mixtral-8x7B-Instruct-v0.1,
108
- TinyLlama/TinyLlama-1.1B-Chat-v1.0,
109
- gemini-pro, gpt-3.5-turbo,
110
- llama-2-70b-chat, zephyr-7b-beta],
111
- 'categoryorder': 'array',
112
- 'domain': [0.0, 1.0],
113
- 'title': {'text': 'model'}},
114
- 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'execution_time'}}}
115
- })",Model endpoints response times
116
- ./html/plots/model_sizes.html,"Figure({
117
- 'data': [{'alignmentgroup': 'True',
118
- 'hovertemplate': 'color=gpt-3.5-turbo<br>x=%{x}<br>y=%{y}<extra></extra>',
119
- 'legendgroup': 'gpt-3.5-turbo',
120
- 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
121
- 'name': 'gpt-3.5-turbo',
122
- 'offsetgroup': 'gpt-3.5-turbo',
123
- 'orientation': 'v',
124
- 'showlegend': True,
125
- 'textposition': 'auto',
126
- 'type': 'bar',
127
- 'x': array(['gpt-3.5-turbo'], dtype=object),
128
- 'xaxis': 'x',
129
- 'y': array([0.]),
130
- 'yaxis': 'y'},
131
- {'alignmentgroup': 'True',
132
- 'hovertemplate': 'color=llama-2-70b-chat<br>x=%{x}<br>y=%{y}<extra></extra>',
133
- 'legendgroup': 'llama-2-70b-chat',
134
- 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
135
- 'name': 'llama-2-70b-chat',
136
- 'offsetgroup': 'llama-2-70b-chat',
137
- 'orientation': 'v',
138
- 'showlegend': True,
139
- 'textposition': 'auto',
140
- 'type': 'bar',
141
- 'x': array(['llama-2-70b-chat'], dtype=object),
142
- 'xaxis': 'x',
143
- 'y': array([0.]),
144
- 'yaxis': 'y'},
145
- {'alignmentgroup': 'True',
146
- 'hovertemplate': 'color=Mixtral-8x7B-Instruct-v0.1<br>x=%{x}<br>y=%{y}<extra></extra>',
147
- 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
148
- 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
149
- 'name': 'Mixtral-8x7B-Instruct-v0.1',
150
- 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
151
- 'orientation': 'v',
152
- 'showlegend': True,
153
- 'textposition': 'auto',
154
- 'type': 'bar',
155
- 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
156
- 'xaxis': 'x',
157
- 'y': array([56.]),
158
- 'yaxis': 'y'},
159
- {'alignmentgroup': 'True',
160
- 'hovertemplate': 'color=zephyr-7b-beta<br>x=%{x}<br>y=%{y}<extra></extra>',
161
- 'legendgroup': 'zephyr-7b-beta',
162
- 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
163
- 'name': 'zephyr-7b-beta',
164
- 'offsetgroup': 'zephyr-7b-beta',
165
- 'orientation': 'v',
166
- 'showlegend': True,
167
- 'textposition': 'auto',
168
- 'type': 'bar',
169
- 'x': array(['zephyr-7b-beta'], dtype=object),
170
- 'xaxis': 'x',
171
- 'y': array([7.]),
172
- 'yaxis': 'y'},
173
- {'alignmentgroup': 'True',
174
- 'hovertemplate': 'color=Mistral-7B-Instruct-v0.2<br>x=%{x}<br>y=%{y}<extra></extra>',
175
- 'legendgroup': 'Mistral-7B-Instruct-v0.2',
176
- 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
177
- 'name': 'Mistral-7B-Instruct-v0.2',
178
- 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
179
- 'orientation': 'v',
180
- 'showlegend': True,
181
- 'textposition': 'auto',
182
- 'type': 'bar',
183
- 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
184
- 'xaxis': 'x',
185
- 'y': array([7.]),
186
- 'yaxis': 'y'},
187
- {'alignmentgroup': 'True',
188
- 'hovertemplate': 'color=TinyLlama/TinyLlama-1.1B-Chat-v1.0<br>x=%{x}<br>y=%{y}<extra></extra>',
189
- 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
190
- 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
191
- 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
192
- 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
193
- 'orientation': 'v',
194
- 'showlegend': True,
195
- 'textposition': 'auto',
196
- 'type': 'bar',
197
- 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
198
- 'xaxis': 'x',
199
- 'y': array([1.1]),
200
- 'yaxis': 'y'},
201
- {'alignmentgroup': 'True',
202
- 'hovertemplate': 'color=gemini-pro<br>x=%{x}<br>y=%{y}<extra></extra>',
203
- 'legendgroup': 'gemini-pro',
204
- 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
205
- 'name': 'gemini-pro',
206
- 'offsetgroup': 'gemini-pro',
207
- 'orientation': 'v',
208
- 'showlegend': True,
209
- 'textposition': 'auto',
210
- 'type': 'bar',
211
- 'x': array(['gemini-pro'], dtype=object),
212
- 'xaxis': 'x',
213
- 'y': array([0.]),
214
- 'yaxis': 'y'}],
215
- 'layout': {'barmode': 'relative',
216
- 'legend': {'title': {'text': 'color'}, 'tracegroupgap': 0},
217
- 'template': '...',
218
- 'title': {'text': 'Model sizes in billions of parameters'},
219
- 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'x'}},
220
- 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'y'}}}
221
- })",Model sizes in billions of parameters
222
- ./html/plots/execution_costs.html,"Figure({
223
- 'data': [{'alignmentgroup': 'True',
224
- 'hovertemplate': 'color=gpt-3.5-turbo<br>x=%{x}<br>y=%{y}<extra></extra>',
225
- 'legendgroup': 'gpt-3.5-turbo',
226
- 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
227
- 'name': 'gpt-3.5-turbo',
228
- 'offsetgroup': 'gpt-3.5-turbo',
229
- 'orientation': 'v',
230
- 'showlegend': True,
231
- 'textposition': 'auto',
232
- 'type': 'bar',
233
- 'x': array(['gpt-3.5-turbo'], dtype=object),
234
- 'xaxis': 'x',
235
- 'y': array([0.2]),
236
- 'yaxis': 'y'},
237
- {'alignmentgroup': 'True',
238
- 'hovertemplate': 'color=llama-2-70b-chat<br>x=%{x}<br>y=%{y}<extra></extra>',
239
- 'legendgroup': 'llama-2-70b-chat',
240
- 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
241
- 'name': 'llama-2-70b-chat',
242
- 'offsetgroup': 'llama-2-70b-chat',
243
- 'orientation': 'v',
244
- 'showlegend': True,
245
- 'textposition': 'auto',
246
- 'type': 'bar',
247
- 'x': array(['llama-2-70b-chat'], dtype=object),
248
- 'xaxis': 'x',
249
- 'y': array([0.03]),
250
- 'yaxis': 'y'},
251
- {'alignmentgroup': 'True',
252
- 'hovertemplate': 'color=Mixtral-8x7B-Instruct-v0.1<br>x=%{x}<br>y=%{y}<extra></extra>',
253
- 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
254
- 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
255
- 'name': 'Mixtral-8x7B-Instruct-v0.1',
256
- 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
257
- 'orientation': 'v',
258
- 'showlegend': True,
259
- 'textposition': 'auto',
260
- 'type': 'bar',
261
- 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
262
- 'xaxis': 'x',
263
- 'y': array([0.135]),
264
- 'yaxis': 'y'},
265
- {'alignmentgroup': 'True',
266
- 'hovertemplate': 'color=zephyr-7b-beta<br>x=%{x}<br>y=%{y}<extra></extra>',
267
- 'legendgroup': 'zephyr-7b-beta',
268
- 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
269
- 'name': 'zephyr-7b-beta',
270
- 'offsetgroup': 'zephyr-7b-beta',
271
- 'orientation': 'v',
272
- 'showlegend': True,
273
- 'textposition': 'auto',
274
- 'type': 'bar',
275
- 'x': array(['zephyr-7b-beta'], dtype=object),
276
- 'xaxis': 'x',
277
- 'y': array([55.45703704]),
278
- 'yaxis': 'y'},
279
- {'alignmentgroup': 'True',
280
- 'hovertemplate': 'color=Mistral-7B-Instruct-v0.2<br>x=%{x}<br>y=%{y}<extra></extra>',
281
- 'legendgroup': 'Mistral-7B-Instruct-v0.2',
282
- 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
283
- 'name': 'Mistral-7B-Instruct-v0.2',
284
- 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
285
- 'orientation': 'v',
286
- 'showlegend': True,
287
- 'textposition': 'auto',
288
- 'type': 'bar',
289
- 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
290
- 'xaxis': 'x',
291
- 'y': array([55.45703704]),
292
- 'yaxis': 'y'},
293
- {'alignmentgroup': 'True',
294
- 'hovertemplate': 'color=TinyLlama/TinyLlama-1.1B-Chat-v1.0<br>x=%{x}<br>y=%{y}<extra></extra>',
295
- 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
296
- 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
297
- 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
298
- 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
299
- 'orientation': 'v',
300
- 'showlegend': True,
301
- 'textposition': 'auto',
302
- 'type': 'bar',
303
- 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
304
- 'xaxis': 'x',
305
- 'y': array([25.59555556]),
306
- 'yaxis': 'y'},
307
- {'alignmentgroup': 'True',
308
- 'hovertemplate': 'color=gemini-pro<br>x=%{x}<br>y=%{y}<extra></extra>',
309
- 'legendgroup': 'gemini-pro',
310
- 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
311
- 'name': 'gemini-pro',
312
- 'offsetgroup': 'gemini-pro',
313
- 'orientation': 'v',
314
- 'showlegend': True,
315
- 'textposition': 'auto',
316
- 'type': 'bar',
317
- 'x': array(['gemini-pro'], dtype=object),
318
- 'xaxis': 'x',
319
- 'y': array([0.05]),
320
- 'yaxis': 'y'}],
321
- 'layout': {'barmode': 'relative',
322
- 'legend': {'title': {'text': 'color'}, 'tracegroupgap': 0},
323
- 'template': '...',
324
- 'title': {'text': 'Costs of execution of a sample query 1000 times'},
325
- 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'x'}},
326
- 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'y'}}}
327
- })",Costs of execution of a sample query 1000 times
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
data/2024-01-22 12:14:03.377435_general_plot.csv DELETED
The diff for this file is too large to render. See raw diff
 
data/2024-01-22 12:15:16.239311chunk_plots.csv DELETED
The diff for this file is too large to render. See raw diff
 
data/2024-01-22 12:23:47.756798_general_plot.csv DELETED
@@ -1,327 +0,0 @@
1
- path,plot_object,description,plot_json
2
- ./html/plots/response_times.html,"Figure({
3
- 'data': [{'alignmentgroup': 'True',
4
- 'hovertemplate': 'model=%{x}<br>execution_time=%{y}<extra></extra>',
5
- 'legendgroup': 'Mistral-7B-Instruct-v0.2',
6
- 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
7
- 'name': 'Mistral-7B-Instruct-v0.2',
8
- 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
9
- 'orientation': 'v',
10
- 'showlegend': True,
11
- 'textposition': 'auto',
12
- 'type': 'bar',
13
- 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
- 'xaxis': 'x',
15
- 'y': array([2.41931988]),
16
- 'yaxis': 'y'},
17
- {'alignmentgroup': 'True',
18
- 'hovertemplate': 'model=%{x}<br>execution_time=%{y}<extra></extra>',
19
- 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
20
- 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
21
- 'name': 'Mixtral-8x7B-Instruct-v0.1',
22
- 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
23
- 'orientation': 'v',
24
- 'showlegend': True,
25
- 'textposition': 'auto',
26
- 'type': 'bar',
27
- 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
- 'xaxis': 'x',
29
- 'y': array([8.43355885]),
30
- 'yaxis': 'y'},
31
- {'alignmentgroup': 'True',
32
- 'hovertemplate': 'model=%{x}<br>execution_time=%{y}<extra></extra>',
33
- 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
34
- 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
35
- 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
36
- 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
37
- 'orientation': 'v',
38
- 'showlegend': True,
39
- 'textposition': 'auto',
40
- 'type': 'bar',
41
- 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
- 'xaxis': 'x',
43
- 'y': array([1.44886649]),
44
- 'yaxis': 'y'},
45
- {'alignmentgroup': 'True',
46
- 'hovertemplate': 'model=%{x}<br>execution_time=%{y}<extra></extra>',
47
- 'legendgroup': 'gemini-pro',
48
- 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
- 'name': 'gemini-pro',
50
- 'offsetgroup': 'gemini-pro',
51
- 'orientation': 'v',
52
- 'showlegend': True,
53
- 'textposition': 'auto',
54
- 'type': 'bar',
55
- 'x': array(['gemini-pro'], dtype=object),
56
- 'xaxis': 'x',
57
- 'y': array([nan]),
58
- 'yaxis': 'y'},
59
- {'alignmentgroup': 'True',
60
- 'hovertemplate': 'model=%{x}<br>execution_time=%{y}<extra></extra>',
61
- 'legendgroup': 'gpt-3.5-turbo',
62
- 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
- 'name': 'gpt-3.5-turbo',
64
- 'offsetgroup': 'gpt-3.5-turbo',
65
- 'orientation': 'v',
66
- 'showlegend': True,
67
- 'textposition': 'auto',
68
- 'type': 'bar',
69
- 'x': array(['gpt-3.5-turbo'], dtype=object),
70
- 'xaxis': 'x',
71
- 'y': array([5.12583753]),
72
- 'yaxis': 'y'},
73
- {'alignmentgroup': 'True',
74
- 'hovertemplate': 'model=%{x}<br>execution_time=%{y}<extra></extra>',
75
- 'legendgroup': 'llama-2-70b-chat',
76
- 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
- 'name': 'llama-2-70b-chat',
78
- 'offsetgroup': 'llama-2-70b-chat',
79
- 'orientation': 'v',
80
- 'showlegend': True,
81
- 'textposition': 'auto',
82
- 'type': 'bar',
83
- 'x': array(['llama-2-70b-chat'], dtype=object),
84
- 'xaxis': 'x',
85
- 'y': array([5.16784139]),
86
- 'yaxis': 'y'},
87
- {'alignmentgroup': 'True',
88
- 'hovertemplate': 'model=%{x}<br>execution_time=%{y}<extra></extra>',
89
- 'legendgroup': 'zephyr-7b-beta',
90
- 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
- 'name': 'zephyr-7b-beta',
92
- 'offsetgroup': 'zephyr-7b-beta',
93
- 'orientation': 'v',
94
- 'showlegend': True,
95
- 'textposition': 'auto',
96
- 'type': 'bar',
97
- 'x': array(['zephyr-7b-beta'], dtype=object),
98
- 'xaxis': 'x',
99
- 'y': array([2.57517529]),
100
- 'yaxis': 'y'}],
101
- 'layout': {'barmode': 'relative',
102
- 'legend': {'title': {'text': 'model'}, 'tracegroupgap': 0},
103
- 'margin': {'t': 60},
104
- 'template': '...',
105
- 'xaxis': {'anchor': 'y',
106
- 'categoryarray': [Mistral-7B-Instruct-v0.2,
107
- Mixtral-8x7B-Instruct-v0.1,
108
- TinyLlama/TinyLlama-1.1B-Chat-v1.0,
109
- gemini-pro, gpt-3.5-turbo,
110
- llama-2-70b-chat, zephyr-7b-beta],
111
- 'categoryorder': 'array',
112
- 'domain': [0.0, 1.0],
113
- 'title': {'text': 'model'}},
114
- 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'execution_time'}}}
115
- })",Model endpoints response times,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""model=%{x}\u003cbr\u003eexecution_time=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[2.4193198829889297],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{x}\u003cbr\u003eexecution_time=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[8.433558851480484],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{x}\u003cbr\u003eexecution_time=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.4488664865493774],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{x}\u003cbr\u003eexecution_time=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"
":[""gemini-pro""],""xaxis"":""x"",""y"":[null],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{x}\u003cbr\u003eexecution_time=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[5.125837534666061],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{x}\u003cbr\u003eexecution_time=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[5.167841389775276],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{x}\u003cbr\u003eexecution_time=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[2.5751752853393555],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colo
rbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444
444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minor
gridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging
"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""gemini-pro"",""gpt-3.5-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""execution_time""}},""legend"":{""title"":{""text"":""model""},""tracegroupgap"":0},""margin"":{""t"":60},""barmode"":""relative""}}"
116
- ./html/plots/model_sizes.html,"Figure({
117
- 'data': [{'alignmentgroup': 'True',
118
- 'hovertemplate': 'color=gpt-3.5-turbo<br>x=%{x}<br>y=%{y}<extra></extra>',
119
- 'legendgroup': 'gpt-3.5-turbo',
120
- 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
121
- 'name': 'gpt-3.5-turbo',
122
- 'offsetgroup': 'gpt-3.5-turbo',
123
- 'orientation': 'v',
124
- 'showlegend': True,
125
- 'textposition': 'auto',
126
- 'type': 'bar',
127
- 'x': array(['gpt-3.5-turbo'], dtype=object),
128
- 'xaxis': 'x',
129
- 'y': array([0.]),
130
- 'yaxis': 'y'},
131
- {'alignmentgroup': 'True',
132
- 'hovertemplate': 'color=llama-2-70b-chat<br>x=%{x}<br>y=%{y}<extra></extra>',
133
- 'legendgroup': 'llama-2-70b-chat',
134
- 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
135
- 'name': 'llama-2-70b-chat',
136
- 'offsetgroup': 'llama-2-70b-chat',
137
- 'orientation': 'v',
138
- 'showlegend': True,
139
- 'textposition': 'auto',
140
- 'type': 'bar',
141
- 'x': array(['llama-2-70b-chat'], dtype=object),
142
- 'xaxis': 'x',
143
- 'y': array([0.]),
144
- 'yaxis': 'y'},
145
- {'alignmentgroup': 'True',
146
- 'hovertemplate': 'color=Mixtral-8x7B-Instruct-v0.1<br>x=%{x}<br>y=%{y}<extra></extra>',
147
- 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
148
- 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
149
- 'name': 'Mixtral-8x7B-Instruct-v0.1',
150
- 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
151
- 'orientation': 'v',
152
- 'showlegend': True,
153
- 'textposition': 'auto',
154
- 'type': 'bar',
155
- 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
156
- 'xaxis': 'x',
157
- 'y': array([56.]),
158
- 'yaxis': 'y'},
159
- {'alignmentgroup': 'True',
160
- 'hovertemplate': 'color=zephyr-7b-beta<br>x=%{x}<br>y=%{y}<extra></extra>',
161
- 'legendgroup': 'zephyr-7b-beta',
162
- 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
163
- 'name': 'zephyr-7b-beta',
164
- 'offsetgroup': 'zephyr-7b-beta',
165
- 'orientation': 'v',
166
- 'showlegend': True,
167
- 'textposition': 'auto',
168
- 'type': 'bar',
169
- 'x': array(['zephyr-7b-beta'], dtype=object),
170
- 'xaxis': 'x',
171
- 'y': array([7.]),
172
- 'yaxis': 'y'},
173
- {'alignmentgroup': 'True',
174
- 'hovertemplate': 'color=Mistral-7B-Instruct-v0.2<br>x=%{x}<br>y=%{y}<extra></extra>',
175
- 'legendgroup': 'Mistral-7B-Instruct-v0.2',
176
- 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
177
- 'name': 'Mistral-7B-Instruct-v0.2',
178
- 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
179
- 'orientation': 'v',
180
- 'showlegend': True,
181
- 'textposition': 'auto',
182
- 'type': 'bar',
183
- 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
184
- 'xaxis': 'x',
185
- 'y': array([7.]),
186
- 'yaxis': 'y'},
187
- {'alignmentgroup': 'True',
188
- 'hovertemplate': 'color=TinyLlama/TinyLlama-1.1B-Chat-v1.0<br>x=%{x}<br>y=%{y}<extra></extra>',
189
- 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
190
- 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
191
- 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
192
- 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
193
- 'orientation': 'v',
194
- 'showlegend': True,
195
- 'textposition': 'auto',
196
- 'type': 'bar',
197
- 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
198
- 'xaxis': 'x',
199
- 'y': array([1.1]),
200
- 'yaxis': 'y'},
201
- {'alignmentgroup': 'True',
202
- 'hovertemplate': 'color=gemini-pro<br>x=%{x}<br>y=%{y}<extra></extra>',
203
- 'legendgroup': 'gemini-pro',
204
- 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
205
- 'name': 'gemini-pro',
206
- 'offsetgroup': 'gemini-pro',
207
- 'orientation': 'v',
208
- 'showlegend': True,
209
- 'textposition': 'auto',
210
- 'type': 'bar',
211
- 'x': array(['gemini-pro'], dtype=object),
212
- 'xaxis': 'x',
213
- 'y': array([0.]),
214
- 'yaxis': 'y'}],
215
- 'layout': {'barmode': 'relative',
216
- 'legend': {'title': {'text': 'color'}, 'tracegroupgap': 0},
217
- 'template': '...',
218
- 'title': {'text': 'Model sizes in billions of parameters'},
219
- 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'x'}},
220
- 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'y'}}}
221
- })",Model sizes in billions of parameters,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""color=gpt-3.5-turbo\u003cbr\u003ex=%{x}\u003cbr\u003ey=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""color=llama-2-70b-chat\u003cbr\u003ex=%{x}\u003cbr\u003ey=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""color=Mixtral-8x7B-Instruct-v0.1\u003cbr\u003ex=%{x}\u003cbr\u003ey=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""color=zephyr-7b-beta\u003cbr\u003ex=%{x}\u003cbr\u003ey=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""b
ar""},{""alignmentgroup"":""True"",""hovertemplate"":""color=Mistral-7B-Instruct-v0.2\u003cbr\u003ex=%{x}\u003cbr\u003ey=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""color=TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0\u003cbr\u003ex=%{x}\u003cbr\u003ey=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.1],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""color=gemini-pro\u003cbr\u003ex=%{x}\u003cbr\u003ey=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.888888888888888
8,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""]
,[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{"
"endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777
777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""x""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""y""}},""legend"":{""title"":{""text"":""color""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"
222
- ./html/plots/execution_costs.html,"Figure({
223
- 'data': [{'alignmentgroup': 'True',
224
- 'hovertemplate': 'color=gpt-3.5-turbo<br>x=%{x}<br>y=%{y}<extra></extra>',
225
- 'legendgroup': 'gpt-3.5-turbo',
226
- 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
227
- 'name': 'gpt-3.5-turbo',
228
- 'offsetgroup': 'gpt-3.5-turbo',
229
- 'orientation': 'v',
230
- 'showlegend': True,
231
- 'textposition': 'auto',
232
- 'type': 'bar',
233
- 'x': array(['gpt-3.5-turbo'], dtype=object),
234
- 'xaxis': 'x',
235
- 'y': array([0.2]),
236
- 'yaxis': 'y'},
237
- {'alignmentgroup': 'True',
238
- 'hovertemplate': 'color=llama-2-70b-chat<br>x=%{x}<br>y=%{y}<extra></extra>',
239
- 'legendgroup': 'llama-2-70b-chat',
240
- 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
241
- 'name': 'llama-2-70b-chat',
242
- 'offsetgroup': 'llama-2-70b-chat',
243
- 'orientation': 'v',
244
- 'showlegend': True,
245
- 'textposition': 'auto',
246
- 'type': 'bar',
247
- 'x': array(['llama-2-70b-chat'], dtype=object),
248
- 'xaxis': 'x',
249
- 'y': array([0.03]),
250
- 'yaxis': 'y'},
251
- {'alignmentgroup': 'True',
252
- 'hovertemplate': 'color=Mixtral-8x7B-Instruct-v0.1<br>x=%{x}<br>y=%{y}<extra></extra>',
253
- 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
254
- 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
255
- 'name': 'Mixtral-8x7B-Instruct-v0.1',
256
- 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
257
- 'orientation': 'v',
258
- 'showlegend': True,
259
- 'textposition': 'auto',
260
- 'type': 'bar',
261
- 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
262
- 'xaxis': 'x',
263
- 'y': array([0.135]),
264
- 'yaxis': 'y'},
265
- {'alignmentgroup': 'True',
266
- 'hovertemplate': 'color=zephyr-7b-beta<br>x=%{x}<br>y=%{y}<extra></extra>',
267
- 'legendgroup': 'zephyr-7b-beta',
268
- 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
269
- 'name': 'zephyr-7b-beta',
270
- 'offsetgroup': 'zephyr-7b-beta',
271
- 'orientation': 'v',
272
- 'showlegend': True,
273
- 'textposition': 'auto',
274
- 'type': 'bar',
275
- 'x': array(['zephyr-7b-beta'], dtype=object),
276
- 'xaxis': 'x',
277
- 'y': array([55.45703704]),
278
- 'yaxis': 'y'},
279
- {'alignmentgroup': 'True',
280
- 'hovertemplate': 'color=Mistral-7B-Instruct-v0.2<br>x=%{x}<br>y=%{y}<extra></extra>',
281
- 'legendgroup': 'Mistral-7B-Instruct-v0.2',
282
- 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
283
- 'name': 'Mistral-7B-Instruct-v0.2',
284
- 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
285
- 'orientation': 'v',
286
- 'showlegend': True,
287
- 'textposition': 'auto',
288
- 'type': 'bar',
289
- 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
290
- 'xaxis': 'x',
291
- 'y': array([55.45703704]),
292
- 'yaxis': 'y'},
293
- {'alignmentgroup': 'True',
294
- 'hovertemplate': 'color=TinyLlama/TinyLlama-1.1B-Chat-v1.0<br>x=%{x}<br>y=%{y}<extra></extra>',
295
- 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
296
- 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
297
- 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
298
- 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
299
- 'orientation': 'v',
300
- 'showlegend': True,
301
- 'textposition': 'auto',
302
- 'type': 'bar',
303
- 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
304
- 'xaxis': 'x',
305
- 'y': array([25.59555556]),
306
- 'yaxis': 'y'},
307
- {'alignmentgroup': 'True',
308
- 'hovertemplate': 'color=gemini-pro<br>x=%{x}<br>y=%{y}<extra></extra>',
309
- 'legendgroup': 'gemini-pro',
310
- 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
311
- 'name': 'gemini-pro',
312
- 'offsetgroup': 'gemini-pro',
313
- 'orientation': 'v',
314
- 'showlegend': True,
315
- 'textposition': 'auto',
316
- 'type': 'bar',
317
- 'x': array(['gemini-pro'], dtype=object),
318
- 'xaxis': 'x',
319
- 'y': array([0.05]),
320
- 'yaxis': 'y'}],
321
- 'layout': {'barmode': 'relative',
322
- 'legend': {'title': {'text': 'color'}, 'tracegroupgap': 0},
323
- 'template': '...',
324
- 'title': {'text': 'Costs of execution of a sample query 1000 times'},
325
- 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'x'}},
326
- 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'y'}}}
327
- })",Costs of execution of a sample query 1000 times,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""color=gpt-3.5-turbo\u003cbr\u003ex=%{x}\u003cbr\u003ey=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[0.2],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""color=llama-2-70b-chat\u003cbr\u003ex=%{x}\u003cbr\u003ey=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[0.030000000000000006],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""color=Mixtral-8x7B-Instruct-v0.1\u003cbr\u003ex=%{x}\u003cbr\u003ey=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[0.135],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""color=zephyr-7b-beta\u003cbr\u003ex=%{x}\u003cbr\u003ey=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[55.45
703703703705],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""color=Mistral-7B-Instruct-v0.2\u003cbr\u003ex=%{x}\u003cbr\u003ey=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[55.45703703703705],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""color=TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0\u003cbr\u003ex=%{x}\u003cbr\u003ey=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[25.59555555555556],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""color=gemini-pro\u003cbr\u003ex=%{x}\u003cbr\u003ey=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[0.05],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666
666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":"
"""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""
minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.55555
55555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""x""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""y""}},""legend"":{""title"":{""text"":""color""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of a sample query 1000 times""},""barmode"":""relative""}}"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
data/{2024-01-25 06:47:26.520416_general_plot.csv → 2024-01-25 12:22:00.759762_general_plot.csv} RENAMED
@@ -12,7 +12,7 @@ path,plot_object,description,comment,plot_json
12
  'type': 'bar',
13
  'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
  'xaxis': 'x',
15
- 'y': array([2.41931988]),
16
  'yaxis': 'y'},
17
  {'alignmentgroup': 'True',
18
  'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
@@ -26,7 +26,7 @@ path,plot_object,description,comment,plot_json
26
  'type': 'bar',
27
  'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
  'xaxis': 'x',
29
- 'y': array([8.43355885]),
30
  'yaxis': 'y'},
31
  {'alignmentgroup': 'True',
32
  'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
@@ -40,143 +40,136 @@ path,plot_object,description,comment,plot_json
40
  'type': 'bar',
41
  'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
  'xaxis': 'x',
43
- 'y': array([1.44886649]),
44
  'yaxis': 'y'},
45
  {'alignmentgroup': 'True',
46
  'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
47
- 'legendgroup': 'gemini-pro',
48
  'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
- 'name': 'gemini-pro',
50
- 'offsetgroup': 'gemini-pro',
51
  'orientation': 'v',
52
  'showlegend': True,
53
  'textposition': 'auto',
54
  'type': 'bar',
55
- 'x': array(['gemini-pro'], dtype=object),
56
  'xaxis': 'x',
57
- 'y': array([nan]),
58
  'yaxis': 'y'},
59
  {'alignmentgroup': 'True',
60
  'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
61
- 'legendgroup': 'gpt-3.5-turbo',
62
  'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
- 'name': 'gpt-3.5-turbo',
64
- 'offsetgroup': 'gpt-3.5-turbo',
65
  'orientation': 'v',
66
  'showlegend': True,
67
  'textposition': 'auto',
68
  'type': 'bar',
69
- 'x': array(['gpt-3.5-turbo'], dtype=object),
70
  'xaxis': 'x',
71
- 'y': array([5.12583753]),
72
  'yaxis': 'y'},
73
  {'alignmentgroup': 'True',
74
  'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
75
- 'legendgroup': 'llama-2-70b-chat',
76
  'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
- 'name': 'llama-2-70b-chat',
78
- 'offsetgroup': 'llama-2-70b-chat',
79
  'orientation': 'v',
80
  'showlegend': True,
81
  'textposition': 'auto',
82
  'type': 'bar',
83
- 'x': array(['llama-2-70b-chat'], dtype=object),
84
  'xaxis': 'x',
85
- 'y': array([5.16784139]),
86
  'yaxis': 'y'},
87
  {'alignmentgroup': 'True',
88
  'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
89
- 'legendgroup': 'zephyr-7b-beta',
90
  'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
- 'name': 'zephyr-7b-beta',
92
- 'offsetgroup': 'zephyr-7b-beta',
93
  'orientation': 'v',
94
  'showlegend': True,
95
  'textposition': 'auto',
96
  'type': 'bar',
97
- 'x': array(['zephyr-7b-beta'], dtype=object),
98
  'xaxis': 'x',
99
- 'y': array([2.57517529]),
100
- 'yaxis': 'y'}],
101
- 'layout': {'barmode': 'relative',
102
- 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
103
- 'template': '...',
104
- 'title': {'text': 'Model endpoints response times'},
105
- 'xaxis': {'anchor': 'y',
106
- 'categoryarray': [Mistral-7B-Instruct-v0.2,
107
- Mixtral-8x7B-Instruct-v0.1,
108
- TinyLlama/TinyLlama-1.1B-Chat-v1.0,
109
- gemini-pro, gpt-3.5-turbo,
110
- llama-2-70b-chat, zephyr-7b-beta],
111
- 'categoryorder': 'array',
112
- 'domain': [0.0, 1.0],
113
- 'title': {'text': 'Model'}},
114
- 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution time (s)'}}}
115
- })",Model endpoints response times,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[2.4193198829889297],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[8.433558851480484],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.4488664865493774],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[null],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[5.125837534666061],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[5.167841389775276],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[2.5751752853393555],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3
786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidi
ty"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ti
cks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line""
:{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""gemini-pro"",""gpt-3.5-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution time (s)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model endpoints response times""},""barmode"":""relative""}}"
116
- ./html/plots/model_sizes.html,"Figure({
117
- 'data': [{'alignmentgroup': 'True',
118
- 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
119
- 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
120
- 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
121
- 'name': 'Mixtral-8x7B-Instruct-v0.1',
122
- 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
123
  'orientation': 'v',
124
  'showlegend': True,
125
  'textposition': 'auto',
126
  'type': 'bar',
127
- 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
128
  'xaxis': 'x',
129
- 'y': array([56.]),
130
  'yaxis': 'y'},
131
  {'alignmentgroup': 'True',
132
- 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
133
- 'legendgroup': 'zephyr-7b-beta',
134
- 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
135
- 'name': 'zephyr-7b-beta',
136
- 'offsetgroup': 'zephyr-7b-beta',
137
  'orientation': 'v',
138
  'showlegend': True,
139
  'textposition': 'auto',
140
  'type': 'bar',
141
- 'x': array(['zephyr-7b-beta'], dtype=object),
142
  'xaxis': 'x',
143
- 'y': array([7.]),
144
  'yaxis': 'y'},
145
  {'alignmentgroup': 'True',
146
- 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
147
- 'legendgroup': 'Mistral-7B-Instruct-v0.2',
148
- 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
149
- 'name': 'Mistral-7B-Instruct-v0.2',
150
- 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
151
  'orientation': 'v',
152
  'showlegend': True,
153
  'textposition': 'auto',
154
  'type': 'bar',
155
- 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
156
  'xaxis': 'x',
157
- 'y': array([7.]),
158
  'yaxis': 'y'},
159
  {'alignmentgroup': 'True',
160
- 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
161
- 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
162
- 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
163
- 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
164
- 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
165
  'orientation': 'v',
166
  'showlegend': True,
167
  'textposition': 'auto',
168
  'type': 'bar',
169
- 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
170
  'xaxis': 'x',
171
- 'y': array([1.1]),
172
  'yaxis': 'y'}],
173
  'layout': {'barmode': 'relative',
174
  'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
175
  'template': '...',
176
- 'title': {'text': 'Model sizes in billions of parameters'},
177
- 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
178
- 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}}}
179
- })",Model sizes in billions of parameters,Note that some models have undisclosed sizes,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B 
params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.1],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.
2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}
}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary""
:{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true
,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"
 
 
 
 
 
 
 
 
 
180
  ./html/plots/execution_costs.html,"Figure({
181
  'data': [{'alignmentgroup': 'True',
182
  'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
@@ -190,7 +183,7 @@ path,plot_object,description,comment,plot_json
190
  'type': 'bar',
191
  'x': array(['gpt-3.5-turbo', 'gpt-3.5-turbo'], dtype=object),
192
  'xaxis': 'x',
193
- 'y': array([0.002944, 0.002944]),
194
  'yaxis': 'y'},
195
  {'alignmentgroup': 'True',
196
  'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
@@ -204,7 +197,7 @@ path,plot_object,description,comment,plot_json
204
  'type': 'bar',
205
  'x': array(['gpt-4-turbo'], dtype=object),
206
  'xaxis': 'x',
207
- 'y': array([0.]),
208
  'yaxis': 'y'},
209
  {'alignmentgroup': 'True',
210
  'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
@@ -218,7 +211,7 @@ path,plot_object,description,comment,plot_json
218
  'type': 'bar',
219
  'x': array(['gpt-4'], dtype=object),
220
  'xaxis': 'x',
221
- 'y': array([0.]),
222
  'yaxis': 'y'},
223
  {'alignmentgroup': 'True',
224
  'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
@@ -232,7 +225,7 @@ path,plot_object,description,comment,plot_json
232
  'type': 'bar',
233
  'x': array(['llama-2-70b-chat'], dtype=object),
234
  'xaxis': 'x',
235
- 'y': array([0.00078]),
236
  'yaxis': 'y'},
237
  {'alignmentgroup': 'True',
238
  'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
@@ -246,7 +239,7 @@ path,plot_object,description,comment,plot_json
246
  'type': 'bar',
247
  'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
248
  'xaxis': 'x',
249
- 'y': array([0.0010602]),
250
  'yaxis': 'y'},
251
  {'alignmentgroup': 'True',
252
  'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
@@ -302,7 +295,7 @@ path,plot_object,description,comment,plot_json
302
  'type': 'bar',
303
  'x': array(['gemini-pro'], dtype=object),
304
  'xaxis': 'x',
305
- 'y': array([0.000205]),
306
  'yaxis': 'y'},
307
  {'alignmentgroup': 'True',
308
  'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
@@ -316,7 +309,7 @@ path,plot_object,description,comment,plot_json
316
  'type': 'bar',
317
  'x': array(['chat-bison'], dtype=object),
318
  'xaxis': 'x',
319
- 'y': array([0.]),
320
  'yaxis': 'y'},
321
  {'alignmentgroup': 'True',
322
  'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
@@ -330,12 +323,76 @@ path,plot_object,description,comment,plot_json
330
  'type': 'bar',
331
  'x': array(['chat-bison-32k'], dtype=object),
332
  'xaxis': 'x',
333
- 'y': array([0.]),
334
  'yaxis': 'y'}],
335
  'layout': {'barmode': 'relative',
336
  'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
337
  'template': '...',
338
- 'title': {'text': 'Costs of execution of 12 test queries per model'},
339
  'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
340
  'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}}}
341
- })",Costs of execution of 12 test queries per model,Note that some providers bill by token count and some by execution time. In the second case we used averaged pausing and resuming time to calculate the cost and assumed that all queries have been done in one session. Also note that for now the Gemini-Pro model is free for under 60 queries per minute.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo"",""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[0.002944,0.002944],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[0.00078],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[0.0010602],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[55.45703703703705],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[55.45703703703705],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[25.59555555555556],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[0.000205],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.55555
55555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""ty
pe"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""b
axis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#
2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 12 test queries per model""},""barmode"":""relative""}}"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
  'type': 'bar',
13
  'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
  'xaxis': 'x',
15
+ 'y': array([3.17454003]),
16
  'yaxis': 'y'},
17
  {'alignmentgroup': 'True',
18
  'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
 
26
  'type': 'bar',
27
  'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
  'xaxis': 'x',
29
+ 'y': array([7.14219763]),
30
  'yaxis': 'y'},
31
  {'alignmentgroup': 'True',
32
  'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
 
40
  'type': 'bar',
41
  'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
  'xaxis': 'x',
43
+ 'y': array([1.29026454]),
44
  'yaxis': 'y'},
45
  {'alignmentgroup': 'True',
46
  'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
47
+ 'legendgroup': 'chat-bison',
48
  'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
+ 'name': 'chat-bison',
50
+ 'offsetgroup': 'chat-bison',
51
  'orientation': 'v',
52
  'showlegend': True,
53
  'textposition': 'auto',
54
  'type': 'bar',
55
+ 'x': array(['chat-bison'], dtype=object),
56
  'xaxis': 'x',
57
+ 'y': array([3.89024363]),
58
  'yaxis': 'y'},
59
  {'alignmentgroup': 'True',
60
  'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
61
+ 'legendgroup': 'chat-bison-32k',
62
  'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
+ 'name': 'chat-bison-32k',
64
+ 'offsetgroup': 'chat-bison-32k',
65
  'orientation': 'v',
66
  'showlegend': True,
67
  'textposition': 'auto',
68
  'type': 'bar',
69
+ 'x': array(['chat-bison-32k'], dtype=object),
70
  'xaxis': 'x',
71
+ 'y': array([4.12817777]),
72
  'yaxis': 'y'},
73
  {'alignmentgroup': 'True',
74
  'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
75
+ 'legendgroup': 'gemini-pro',
76
  'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
+ 'name': 'gemini-pro',
78
+ 'offsetgroup': 'gemini-pro',
79
  'orientation': 'v',
80
  'showlegend': True,
81
  'textposition': 'auto',
82
  'type': 'bar',
83
+ 'x': array(['gemini-pro'], dtype=object),
84
  'xaxis': 'x',
85
+ 'y': array([4.72138064]),
86
  'yaxis': 'y'},
87
  {'alignmentgroup': 'True',
88
  'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
89
+ 'legendgroup': 'gpt-3.5-turbo',
90
  'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
+ 'name': 'gpt-3.5-turbo',
92
+ 'offsetgroup': 'gpt-3.5-turbo',
93
  'orientation': 'v',
94
  'showlegend': True,
95
  'textposition': 'auto',
96
  'type': 'bar',
97
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
98
  'xaxis': 'x',
99
+ 'y': array([5.28237349]),
100
+ 'yaxis': 'y'},
101
+ {'alignmentgroup': 'True',
102
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
103
+ 'legendgroup': 'gpt-4',
104
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
105
+ 'name': 'gpt-4',
106
+ 'offsetgroup': 'gpt-4',
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
107
  'orientation': 'v',
108
  'showlegend': True,
109
  'textposition': 'auto',
110
  'type': 'bar',
111
+ 'x': array(['gpt-4'], dtype=object),
112
  'xaxis': 'x',
113
+ 'y': array([15.52184566]),
114
  'yaxis': 'y'},
115
  {'alignmentgroup': 'True',
116
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
117
+ 'legendgroup': 'gpt-4-turbo',
118
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
119
+ 'name': 'gpt-4-turbo',
120
+ 'offsetgroup': 'gpt-4-turbo',
121
  'orientation': 'v',
122
  'showlegend': True,
123
  'textposition': 'auto',
124
  'type': 'bar',
125
+ 'x': array(['gpt-4-turbo'], dtype=object),
126
  'xaxis': 'x',
127
+ 'y': array([14.00852903]),
128
  'yaxis': 'y'},
129
  {'alignmentgroup': 'True',
130
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
131
+ 'legendgroup': 'llama-2-70b-chat',
132
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
133
+ 'name': 'llama-2-70b-chat',
134
+ 'offsetgroup': 'llama-2-70b-chat',
135
  'orientation': 'v',
136
  'showlegend': True,
137
  'textposition': 'auto',
138
  'type': 'bar',
139
+ 'x': array(['llama-2-70b-chat'], dtype=object),
140
  'xaxis': 'x',
141
+ 'y': array([6.0658799]),
142
  'yaxis': 'y'},
143
  {'alignmentgroup': 'True',
144
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
145
+ 'legendgroup': 'zephyr-7b-beta',
146
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
147
+ 'name': 'zephyr-7b-beta',
148
+ 'offsetgroup': 'zephyr-7b-beta',
149
  'orientation': 'v',
150
  'showlegend': True,
151
  'textposition': 'auto',
152
  'type': 'bar',
153
+ 'x': array(['zephyr-7b-beta'], dtype=object),
154
  'xaxis': 'x',
155
+ 'y': array([3.23879932]),
156
  'yaxis': 'y'}],
157
  'layout': {'barmode': 'relative',
158
  'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
159
  'template': '...',
160
+ 'title': {'text': 'Model endpoints response times'},
161
+ 'xaxis': {'anchor': 'y',
162
+ 'categoryarray': [Mistral-7B-Instruct-v0.2,
163
+ Mixtral-8x7B-Instruct-v0.1,
164
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
165
+ chat-bison, chat-bison-32k, gemini-pro,
166
+ gpt-3.5-turbo, gpt-4, gpt-4-turbo,
167
+ llama-2-70b-chat, zephyr-7b-beta],
168
+ 'categoryorder': 'array',
169
+ 'domain': [0.0, 1.0],
170
+ 'title': {'text': 'Model'}},
171
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution time (s)'}}}
172
+ })",Model endpoints response times,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[3.174540030956268],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[7.142197625471814],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.2902645373344421],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[3.890243631601334],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[4.128177767992019],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[4.72138064004937],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[5.282373493889353],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[15.5218456586202],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[14.008529031276703],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[6.06587989590749],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[3.2387993240356447],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3
786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidi
ty"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ti
cks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line""
:{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison"",""chat-bison-32k"",""gemini-pro"",""gpt-3.5-turbo"",""gpt-4"",""gpt-4-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution time (s)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model endpoints response times""},""barmode"":""relative""}}"
173
  ./html/plots/execution_costs.html,"Figure({
174
  'data': [{'alignmentgroup': 'True',
175
  'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
 
183
  'type': 'bar',
184
  'x': array(['gpt-3.5-turbo', 'gpt-3.5-turbo'], dtype=object),
185
  'xaxis': 'x',
186
+ 'y': array([0.144438, 0.144438]),
187
  'yaxis': 'y'},
188
  {'alignmentgroup': 'True',
189
  'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
 
197
  'type': 'bar',
198
  'x': array(['gpt-4-turbo'], dtype=object),
199
  'xaxis': 'x',
200
+ 'y': array([0.44014]),
201
  'yaxis': 'y'},
202
  {'alignmentgroup': 'True',
203
  'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
 
211
  'type': 'bar',
212
  'x': array(['gpt-4'], dtype=object),
213
  'xaxis': 'x',
214
+ 'y': array([1.1724]),
215
  'yaxis': 'y'},
216
  {'alignmentgroup': 'True',
217
  'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
 
225
  'type': 'bar',
226
  'x': array(['llama-2-70b-chat'], dtype=object),
227
  'xaxis': 'x',
228
+ 'y': array([0.0186864]),
229
  'yaxis': 'y'},
230
  {'alignmentgroup': 'True',
231
  'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
 
239
  'type': 'bar',
240
  'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
241
  'xaxis': 'x',
242
+ 'y': array([0.0781551]),
243
  'yaxis': 'y'},
244
  {'alignmentgroup': 'True',
245
  'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
 
295
  'type': 'bar',
296
  'x': array(['gemini-pro'], dtype=object),
297
  'xaxis': 'x',
298
+ 'y': array([0.022971]),
299
  'yaxis': 'y'},
300
  {'alignmentgroup': 'True',
301
  'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
 
309
  'type': 'bar',
310
  'x': array(['chat-bison'], dtype=object),
311
  'xaxis': 'x',
312
+ 'y': array([0.008985]),
313
  'yaxis': 'y'},
314
  {'alignmentgroup': 'True',
315
  'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
 
323
  'type': 'bar',
324
  'x': array(['chat-bison-32k'], dtype=object),
325
  'xaxis': 'x',
326
+ 'y': array([0.0089655]),
327
  'yaxis': 'y'}],
328
  'layout': {'barmode': 'relative',
329
  'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
330
  'template': '...',
331
+ 'title': {'text': 'Costs of execution of 80 test queries per model'},
332
  'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
333
  'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}}}
334
+ })",Costs of execution of 80 test queries per model,Note that some providers bill by token count and some by execution time. In the second case we used averaged pausing and resuming time to calculate the cost and assumed that all queries have been done in one session. Also note that for now the Gemini-Pro model is free for under 60 queries per minute.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo"",""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[0.144438,0.144438],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[0.44014],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[1.1724],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[0.0186864],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[0.07815509999999999],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[55.45703703703705],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[55.45703703703705],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[25.59555555555556],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[0.022971],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[0.008985],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[0.0089655],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0
.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}
},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""
"},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color
"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 80 test queries per model""},""barmode"":""relative""}}"
335
+ ./html/plots/model_sizes.html,"Figure({
336
+ 'data': [{'alignmentgroup': 'True',
337
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
338
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
339
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
340
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
341
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
342
+ 'orientation': 'v',
343
+ 'showlegend': True,
344
+ 'textposition': 'auto',
345
+ 'type': 'bar',
346
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
347
+ 'xaxis': 'x',
348
+ 'y': array([56.]),
349
+ 'yaxis': 'y'},
350
+ {'alignmentgroup': 'True',
351
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
352
+ 'legendgroup': 'zephyr-7b-beta',
353
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
354
+ 'name': 'zephyr-7b-beta',
355
+ 'offsetgroup': 'zephyr-7b-beta',
356
+ 'orientation': 'v',
357
+ 'showlegend': True,
358
+ 'textposition': 'auto',
359
+ 'type': 'bar',
360
+ 'x': array(['zephyr-7b-beta'], dtype=object),
361
+ 'xaxis': 'x',
362
+ 'y': array([7.]),
363
+ 'yaxis': 'y'},
364
+ {'alignmentgroup': 'True',
365
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
366
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
367
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
368
+ 'name': 'Mistral-7B-Instruct-v0.2',
369
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
370
+ 'orientation': 'v',
371
+ 'showlegend': True,
372
+ 'textposition': 'auto',
373
+ 'type': 'bar',
374
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
375
+ 'xaxis': 'x',
376
+ 'y': array([7.]),
377
+ 'yaxis': 'y'},
378
+ {'alignmentgroup': 'True',
379
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
380
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
381
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
382
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
383
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
384
+ 'orientation': 'v',
385
+ 'showlegend': True,
386
+ 'textposition': 'auto',
387
+ 'type': 'bar',
388
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
389
+ 'xaxis': 'x',
390
+ 'y': array([1.1]),
391
+ 'yaxis': 'y'}],
392
+ 'layout': {'barmode': 'relative',
393
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
394
+ 'template': '...',
395
+ 'title': {'text': 'Model sizes in billions of parameters'},
396
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
397
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}}}
398
+ })",Model sizes in billions of parameters,Note that some models have undisclosed sizes,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B 
params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.1],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.
2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}
}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary""
:{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true
,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"
data/2024-01-25 13:30:17.207984_summary.csv ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,language,template_name,execution_time,characters_count,words_count,chunk_sizes_mean,chunk_sizes_min,chunk_sizes_max,chunk_generation_times_mean,chunk_generation_times_min,chunk_generation_times_max
2
+ Mistral-7B-Instruct-v0.2,english,call,,,,,,,,,
3
+ Mistral-7B-Instruct-v0.2,english,json,7.318650853633881,222.2,35.95,4.157156220767072,1.0,14.0,0.10865272596910582,0.00024437904357910156,60.7178213596344
4
+ Mistral-7B-Instruct-v0.2,english,markdown,2.8044421672821045,238.15,38.35,4.148954703832753,1.0,14.0,0.03463017442085187,0.020945072174072266,0.25538039207458496
5
+ Mistral-7B-Instruct-v0.2,japanese,call,,,,,,,,,
6
+ Mistral-7B-Instruct-v0.2,japanese,json,1.929928070306778,37.9,2.95,1.3882783882783882,1.0,11.0,0.039187116718990896,0.020466089248657227,0.23994874954223633
7
+ Mistral-7B-Instruct-v0.2,japanese,markdown,1.8897509932518006,28.85,1.15,1.088679245283019,1.0,4.0,0.0396594097029488,0.0004932880401611328,0.2205650806427002
8
+ Mixtral-8x7B-Instruct-v0.1,english,call,,,,,,,,,
9
+ Mixtral-8x7B-Instruct-v0.1,english,json,3.181837737560272,394.95,61.5,4.355665839536807,1.0,15.0,0.015196637342151676,0.0002071857452392578,1.011472463607788
10
+ Mixtral-8x7B-Instruct-v0.1,english,markdown,3.399144798517227,654.4,105.05,4.374331550802139,1.0,14.0,0.013296874289844125,0.00021576881408691406,0.5904912948608398
11
+ Mixtral-8x7B-Instruct-v0.1,japanese,call,,,,,,,,,
12
+ Mixtral-8x7B-Instruct-v0.1,japanese,json,8.82588157138309,532.425,56.35,2.0712896323672436,1.0,15.0,0.027260187998098102,0.0002186298370361328,76.45081758499146
13
+ Mixtral-8x7B-Instruct-v0.1,japanese,markdown,12.566328430175782,460.6,5.7,1.0741604477611941,1.0,9.0,0.01511352992991903,0.00021529197692871094,0.8098442554473877
14
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,call,,,,,,,,,
15
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,json,1.3998499751091003,203.15,34.6,4.120689655172414,1.0,13.0,0.01180358711652775,0.0003421306610107422,0.13397955894470215
16
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,markdown,1.4005955815315247,179.5,30.65,3.847802786709539,1.0,14.0,0.01265179331535184,0.0003273487091064453,0.13492584228515625
17
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,japanese,call,,,,,,,,,
18
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,japanese,json,1.2260903775691987,48.35,5.8,1.95748987854251,1.0,13.0,0.01474765992840292,0.00041413307189941406,0.18952107429504395
19
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,japanese,markdown,1.1986963748931885,51.55,6.85,2.0415841584158416,1.0,10.0,0.014000740617808729,0.0005300045013427734,0.16827392578125
20
+ chat-bison,english,call,,,,,,,,,
21
+ chat-bison,english,json,3.446989095211029,550.05,86.0,89.4390243902439,1.0,138.0,0.4258628240445765,0.0006544589996337891,2.2015340328216553
22
+ chat-bison,japanese,call,,,,,,,,,
23
+ chat-bison,japanese,json,4.333498167991638,246.1,12.0,33.48299319727891,3.0,124.0,0.47770044917152044,0.0005426406860351562,3.5425846576690674
24
+ chat-bison-32k,english,call,,,,,,,,,
25
+ chat-bison-32k,english,json,3.74513863325119,538.4,84.25,88.26229508196721,1.0,134.0,0.47832588094179745,0.0006556510925292969,3.0114917755126953
26
+ chat-bison-32k,japanese,call,,,,,,,,,
27
+ chat-bison-32k,japanese,json,4.5112169027328495,241.45,11.8,35.77037037037037,6.0,124.0,0.5467217816246881,0.0005869865417480469,4.387756824493408
28
+ gemini-pro,english,call,,,,,,,,,
29
+ gemini-pro,english,json,3.6837018529574075,557.475,87.225,175.58267716535434,4.0,988.0,1.0232121174729716,0.0006723403930664062,8.669384241104126
30
+ gemini-pro,english,markdown,4.207570552825928,663.8,109.05,139.74736842105264,19.0,472.0,0.7348335742950439,0.0007510185241699219,2.7830429077148438
31
+ gemini-pro,japanese,call,,,,,,,,,
32
+ gemini-pro,japanese,json,4.794884290013995,189.55,4.05,64.2542372881356,4.0,215.0,1.1180692850533178,0.0006062984466552734,5.698127031326294
33
+ gemini-pro,japanese,markdown,7.311563323525822,392.7,7.75,62.832,15.0,203.0,0.9826514282226563,0.0006639957427978516,13.754565954208374
34
+ gpt-3.5-turbo,english,call,3.409479808062315,671.15625,108.59375,,,,,,
35
+ gpt-3.5-turbo,english,json,2.650409721559094,564.6451612903226,90.98387096774194,5.037122302158274,1.0,16.0,0.017705622920029456,0.0005590915679931641,0.4925534725189209
36
+ gpt-3.5-turbo,english,markdown,3.1277945737044015,649.3333333333334,103.75,5.186023294509152,1.0,16.0,0.019346605402459322,0.0006084442138671875,1.127073049545288
37
+ gpt-3.5-turbo,japanese,call,8.916680586142618,375.1875,4.9375,,,,,,
38
+ gpt-3.5-turbo,japanese,json,6.141976299932447,244.75806451612902,3.306451612903226,1.1217474866942638,1.0,7.0,0.0232258041112258,0.0005545616149902344,13.75982117652893
39
+ gpt-3.5-turbo,japanese,markdown,8.25130424045381,315.5,1.3636363636363635,1.1153784348385023,1.0,10.0,0.025426305415027686,0.0005831718444824219,13.71114993095398
40
+ gpt-4,english,call,10.59899697303772,538.45,83.7,,,,,,
41
+ gpt-4,english,json,9.713180017471313,558.35,87.5,4.971950133570792,1.0,16.0,0.07619813660479824,0.0005440711975097656,1.9534873962402344
42
+ gpt-4,japanese,call,22.77469485684445,242.1,1.2,,,,,,
43
+ gpt-4,japanese,json,19.565327330639487,217.85,4.1,1.1505149194613151,1.0,7.0,0.09166746716213503,0.0005655288696289062,2.1393778324127197
44
+ gpt-4-turbo,english,call,9.345100498199463,550.9,84.9,,,,,,
45
+ gpt-4-turbo,english,json,8.325499892234802,686.55,105.4,5.042600073448402,1.0,17.0,0.05410054322774035,0.0007143020629882812,0.755082368850708
46
+ gpt-4-turbo,japanese,call,18.703535676002502,222.35,3.6,,,,,,
47
+ gpt-4-turbo,japanese,json,19.659980058670044,272.5,6.0,1.181956191715463,1.0,8.0,0.07962745783567377,0.0006952285766601562,13.252992153167725
48
+ llama-2-70b-chat,english,call,,,,,,,,,
49
+ llama-2-70b-chat,english,json,3.55666184425354,427.6363636363636,65.81818181818181,4.172062084257206,1.0,14.0,0.01772472985303587,0.00021791458129882812,0.5100884437561035
50
+ llama-2-70b-chat,english,markdown,6.183407843112946,1169.7727272727273,184.1818181818182,4.07263807564488,1.0,16.0,0.01361775794423896,0.0002124309539794922,0.5661592483520508
51
+ llama-2-70b-chat,japanese,call,,,,,,,,,
52
+ llama-2-70b-chat,japanese,json,4.945841180650811,350.4761904761905,42.642857142857146,2.46483590087073,1.0,15.0,0.01905980879878806,0.00021982192993164062,0.35228896141052246
53
+ llama-2-70b-chat,japanese,markdown,14.294062587949965,1299.1818181818182,172.5,2.8476636445152934,1.0,16.0,0.02320206142747451,0.0002117156982421875,76.44498753547668
54
+ zephyr-7b-beta,english,call,,,,,,,,,
55
+ zephyr-7b-beta,english,json,2.845248854160309,238.1,39.2,4.274685816876122,1.0,14.0,0.03622233246986485,0.0003070831298828125,0.4896988868713379
56
+ zephyr-7b-beta,english,markdown,7.618257820606232,238.65,38.75,4.358904109589041,1.0,15.0,0.1235110485390441,0.00040459632873535156,75.15552616119385
57
+ zephyr-7b-beta,japanese,call,,,,,,,,,
58
+ zephyr-7b-beta,japanese,json,1.921021181344986,29.75,3.3,1.1829025844930416,1.0,7.0,0.042037644869764565,0.018090486526489258,0.4599947929382324
59
+ zephyr-7b-beta,japanese,markdown,1.8884475827217102,26.6,1.75,1.0350194552529184,1.0,4.0,0.04097196471366437,0.02583909034729004,0.4606599807739258
data/2024-01-25 13:30:20.959750_time_of_day_comparison.csv ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,time_of_day,execution_time,characters_count,words_count
2
+ Mistral-7B-Instruct-v0.2,afternoon,,,
3
+ Mistral-7B-Instruct-v0.2,evening,,,
4
+ Mistral-7B-Instruct-v0.2,morning,3.174540030956268,113.0,16.27
5
+ Mixtral-8x7B-Instruct-v0.1,morning,7.142197625471814,494.9583333333333,57.74166666666667
6
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,morning,1.2902645373344421,106.18,16.74
7
+ chat-bison,morning,3.890243631601334,398.075,49.0
8
+ chat-bison-32k,morning,4.128177767992019,389.925,48.025
9
+ gemini-pro,morning,4.72138064004937,425.09166666666664,49.891666666666666
10
+ gpt-3.5-turbo,afternoon,4.666725277900696,302.1666666666667,32.0
11
+ gpt-3.5-turbo,evening,4.351089119911194,305.25,28.5
12
+ gpt-3.5-turbo,morning,5.336839800789242,479.2785714285714,53.92142857142857
13
+ gpt-4,morning,15.5218456586202,389.1875,44.125
14
+ gpt-4-turbo,morning,14.008529031276703,433.075,49.975
15
+ llama-2-70b-chat,afternoon,2.1692867279052734,292.0,43.5
16
+ llama-2-70b-chat,evening,5.552149415016174,967.5,141.25
17
+ llama-2-70b-chat,morning,6.175082007679371,662.7416666666667,94.30833333333334
18
+ zephyr-7b-beta,afternoon,,,
19
+ zephyr-7b-beta,evening,,,
20
+ zephyr-7b-beta,morning,3.2387993240356447,112.57,17.26
data/2024-01-25 13:34:46.224347_summary.csv ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,language,template_name,execution_time,characters_count,words_count,chunk_sizes_mean,chunk_sizes_min,chunk_sizes_max,chunk_generation_times_mean,chunk_generation_times_min,chunk_generation_times_max
2
+ Mistral-7B-Instruct-v0.2,english,call,,,,,,,,,
3
+ Mistral-7B-Instruct-v0.2,english,json,7.318650853633881,222.2,35.95,4.157156220767072,1.0,14.0,0.10865272596910582,0.00024437904357910156,60.7178213596344
4
+ Mistral-7B-Instruct-v0.2,english,markdown,2.8044421672821045,238.15,38.35,4.148954703832753,1.0,14.0,0.03463017442085187,0.020945072174072266,0.25538039207458496
5
+ Mistral-7B-Instruct-v0.2,japanese,call,,,,,,,,,
6
+ Mistral-7B-Instruct-v0.2,japanese,json,1.929928070306778,37.9,2.95,1.3882783882783882,1.0,11.0,0.039187116718990896,0.020466089248657227,0.23994874954223633
7
+ Mistral-7B-Instruct-v0.2,japanese,markdown,1.8897509932518006,28.85,1.15,1.088679245283019,1.0,4.0,0.0396594097029488,0.0004932880401611328,0.2205650806427002
8
+ Mixtral-8x7B-Instruct-v0.1,english,call,,,,,,,,,
9
+ Mixtral-8x7B-Instruct-v0.1,english,json,3.181837737560272,394.95,61.5,4.355665839536807,1.0,15.0,0.015196637342151676,0.0002071857452392578,1.011472463607788
10
+ Mixtral-8x7B-Instruct-v0.1,english,markdown,3.399144798517227,654.4,105.05,4.374331550802139,1.0,14.0,0.013296874289844125,0.00021576881408691406,0.5904912948608398
11
+ Mixtral-8x7B-Instruct-v0.1,japanese,call,,,,,,,,,
12
+ Mixtral-8x7B-Instruct-v0.1,japanese,json,8.82588157138309,532.425,56.35,2.0712896323672436,1.0,15.0,0.027260187998098102,0.0002186298370361328,76.45081758499146
13
+ Mixtral-8x7B-Instruct-v0.1,japanese,markdown,12.566328430175782,460.6,5.7,1.0741604477611941,1.0,9.0,0.01511352992991903,0.00021529197692871094,0.8098442554473877
14
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,call,,,,,,,,,
15
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,json,1.3998499751091003,203.15,34.6,4.120689655172414,1.0,13.0,0.01180358711652775,0.0003421306610107422,0.13397955894470215
16
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,markdown,1.4005955815315247,179.5,30.65,3.847802786709539,1.0,14.0,0.01265179331535184,0.0003273487091064453,0.13492584228515625
17
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,japanese,call,,,,,,,,,
18
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,japanese,json,1.2260903775691987,48.35,5.8,1.95748987854251,1.0,13.0,0.01474765992840292,0.00041413307189941406,0.18952107429504395
19
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,japanese,markdown,1.1986963748931885,51.55,6.85,2.0415841584158416,1.0,10.0,0.014000740617808729,0.0005300045013427734,0.16827392578125
20
+ chat-bison,english,call,,,,,,,,,
21
+ chat-bison,english,json,3.446989095211029,550.05,86.0,89.4390243902439,1.0,138.0,0.4258628240445765,0.0006544589996337891,2.2015340328216553
22
+ chat-bison,japanese,call,,,,,,,,,
23
+ chat-bison,japanese,json,4.333498167991638,246.1,12.0,33.48299319727891,3.0,124.0,0.47770044917152044,0.0005426406860351562,3.5425846576690674
24
+ chat-bison-32k,english,call,,,,,,,,,
25
+ chat-bison-32k,english,json,3.74513863325119,538.4,84.25,88.26229508196721,1.0,134.0,0.47832588094179745,0.0006556510925292969,3.0114917755126953
26
+ chat-bison-32k,japanese,call,,,,,,,,,
27
+ chat-bison-32k,japanese,json,4.5112169027328495,241.45,11.8,35.77037037037037,6.0,124.0,0.5467217816246881,0.0005869865417480469,4.387756824493408
28
+ gemini-pro,english,call,,,,,,,,,
29
+ gemini-pro,english,json,3.6837018529574075,557.475,87.225,175.58267716535434,4.0,988.0,1.0232121174729716,0.0006723403930664062,8.669384241104126
30
+ gemini-pro,english,markdown,4.207570552825928,663.8,109.05,139.74736842105264,19.0,472.0,0.7348335742950439,0.0007510185241699219,2.7830429077148438
31
+ gemini-pro,japanese,call,,,,,,,,,
32
+ gemini-pro,japanese,json,4.794884290013995,189.55,4.05,64.2542372881356,4.0,215.0,1.1180692850533178,0.0006062984466552734,5.698127031326294
33
+ gemini-pro,japanese,markdown,7.311563323525822,392.7,7.75,62.832,15.0,203.0,0.9826514282226563,0.0006639957427978516,13.754565954208374
34
+ gpt-3.5-turbo,english,call,3.409479808062315,671.15625,108.59375,,,,,,
35
+ gpt-3.5-turbo,english,json,2.650409721559094,564.6451612903226,90.98387096774194,5.037122302158274,1.0,16.0,0.017705622920029456,0.0005590915679931641,0.4925534725189209
36
+ gpt-3.5-turbo,english,markdown,3.1277945737044015,649.3333333333334,103.75,5.186023294509152,1.0,16.0,0.019346605402459322,0.0006084442138671875,1.127073049545288
37
+ gpt-3.5-turbo,japanese,call,8.916680586142618,375.1875,4.9375,,,,,,
38
+ gpt-3.5-turbo,japanese,json,6.141976299932447,244.75806451612902,3.306451612903226,1.1217474866942638,1.0,7.0,0.0232258041112258,0.0005545616149902344,13.75982117652893
39
+ gpt-3.5-turbo,japanese,markdown,8.25130424045381,315.5,1.3636363636363635,1.1153784348385023,1.0,10.0,0.025426305415027686,0.0005831718444824219,13.71114993095398
40
+ gpt-4,english,call,10.59899697303772,538.45,83.7,,,,,,
41
+ gpt-4,english,json,9.713180017471313,558.35,87.5,4.971950133570792,1.0,16.0,0.07619813660479824,0.0005440711975097656,1.9534873962402344
42
+ gpt-4,japanese,call,22.77469485684445,242.1,1.2,,,,,,
43
+ gpt-4,japanese,json,19.565327330639487,217.85,4.1,1.1505149194613151,1.0,7.0,0.09166746716213503,0.0005655288696289062,2.1393778324127197
44
+ gpt-4-turbo,english,call,9.345100498199463,550.9,84.9,,,,,,
45
+ gpt-4-turbo,english,json,8.325499892234802,686.55,105.4,5.042600073448402,1.0,17.0,0.05410054322774035,0.0007143020629882812,0.755082368850708
46
+ gpt-4-turbo,japanese,call,18.703535676002502,222.35,3.6,,,,,,
47
+ gpt-4-turbo,japanese,json,19.659980058670044,272.5,6.0,1.181956191715463,1.0,8.0,0.07962745783567377,0.0006952285766601562,13.252992153167725
48
+ llama-2-70b-chat,english,call,,,,,,,,,
49
+ llama-2-70b-chat,english,json,3.55666184425354,427.6363636363636,65.81818181818181,4.172062084257206,1.0,14.0,0.01772472985303587,0.00021791458129882812,0.5100884437561035
50
+ llama-2-70b-chat,english,markdown,6.183407843112946,1169.7727272727273,184.1818181818182,4.07263807564488,1.0,16.0,0.01361775794423896,0.0002124309539794922,0.5661592483520508
51
+ llama-2-70b-chat,japanese,call,,,,,,,,,
52
+ llama-2-70b-chat,japanese,json,4.945841180650811,350.4761904761905,42.642857142857146,2.46483590087073,1.0,15.0,0.01905980879878806,0.00021982192993164062,0.35228896141052246
53
+ llama-2-70b-chat,japanese,markdown,14.294062587949965,1299.1818181818182,172.5,2.8476636445152934,1.0,16.0,0.02320206142747451,0.0002117156982421875,76.44498753547668
54
+ zephyr-7b-beta,english,call,,,,,,,,,
55
+ zephyr-7b-beta,english,json,2.845248854160309,238.1,39.2,4.274685816876122,1.0,14.0,0.03622233246986485,0.0003070831298828125,0.4896988868713379
56
+ zephyr-7b-beta,english,markdown,7.618257820606232,238.65,38.75,4.358904109589041,1.0,15.0,0.1235110485390441,0.00040459632873535156,75.15552616119385
57
+ zephyr-7b-beta,japanese,call,,,,,,,,,
58
+ zephyr-7b-beta,japanese,json,1.921021181344986,29.75,3.3,1.1829025844930416,1.0,7.0,0.042037644869764565,0.018090486526489258,0.4599947929382324
59
+ zephyr-7b-beta,japanese,markdown,1.8884475827217102,26.6,1.75,1.0350194552529184,1.0,4.0,0.04097196471366437,0.02583909034729004,0.4606599807739258
data/2024-01-26 11:01:41.169428_general_plot.csv ADDED
@@ -0,0 +1,398 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ path,plot_object,description,comment,plot_json
2
+ ./html/plots/response_times.html,"Figure({
3
+ 'data': [{'alignmentgroup': 'True',
4
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
5
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
6
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
7
+ 'name': 'Mistral-7B-Instruct-v0.2',
8
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
9
+ 'orientation': 'v',
10
+ 'showlegend': True,
11
+ 'textposition': 'auto',
12
+ 'type': 'bar',
13
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
+ 'xaxis': 'x',
15
+ 'y': array([3.17454003]),
16
+ 'yaxis': 'y'},
17
+ {'alignmentgroup': 'True',
18
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
19
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
20
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
21
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
22
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
23
+ 'orientation': 'v',
24
+ 'showlegend': True,
25
+ 'textposition': 'auto',
26
+ 'type': 'bar',
27
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
+ 'xaxis': 'x',
29
+ 'y': array([7.14219763]),
30
+ 'yaxis': 'y'},
31
+ {'alignmentgroup': 'True',
32
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
33
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
34
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
35
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
36
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
37
+ 'orientation': 'v',
38
+ 'showlegend': True,
39
+ 'textposition': 'auto',
40
+ 'type': 'bar',
41
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
+ 'xaxis': 'x',
43
+ 'y': array([1.29026454]),
44
+ 'yaxis': 'y'},
45
+ {'alignmentgroup': 'True',
46
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
47
+ 'legendgroup': 'chat-bison',
48
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
+ 'name': 'chat-bison',
50
+ 'offsetgroup': 'chat-bison',
51
+ 'orientation': 'v',
52
+ 'showlegend': True,
53
+ 'textposition': 'auto',
54
+ 'type': 'bar',
55
+ 'x': array(['chat-bison'], dtype=object),
56
+ 'xaxis': 'x',
57
+ 'y': array([3.89024363]),
58
+ 'yaxis': 'y'},
59
+ {'alignmentgroup': 'True',
60
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
61
+ 'legendgroup': 'chat-bison-32k',
62
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
+ 'name': 'chat-bison-32k',
64
+ 'offsetgroup': 'chat-bison-32k',
65
+ 'orientation': 'v',
66
+ 'showlegend': True,
67
+ 'textposition': 'auto',
68
+ 'type': 'bar',
69
+ 'x': array(['chat-bison-32k'], dtype=object),
70
+ 'xaxis': 'x',
71
+ 'y': array([4.12817777]),
72
+ 'yaxis': 'y'},
73
+ {'alignmentgroup': 'True',
74
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
75
+ 'legendgroup': 'gemini-pro',
76
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
+ 'name': 'gemini-pro',
78
+ 'offsetgroup': 'gemini-pro',
79
+ 'orientation': 'v',
80
+ 'showlegend': True,
81
+ 'textposition': 'auto',
82
+ 'type': 'bar',
83
+ 'x': array(['gemini-pro'], dtype=object),
84
+ 'xaxis': 'x',
85
+ 'y': array([4.72138064]),
86
+ 'yaxis': 'y'},
87
+ {'alignmentgroup': 'True',
88
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
89
+ 'legendgroup': 'gpt-3.5-turbo',
90
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
+ 'name': 'gpt-3.5-turbo',
92
+ 'offsetgroup': 'gpt-3.5-turbo',
93
+ 'orientation': 'v',
94
+ 'showlegend': True,
95
+ 'textposition': 'auto',
96
+ 'type': 'bar',
97
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
98
+ 'xaxis': 'x',
99
+ 'y': array([5.28237349]),
100
+ 'yaxis': 'y'},
101
+ {'alignmentgroup': 'True',
102
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
103
+ 'legendgroup': 'gpt-4',
104
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
105
+ 'name': 'gpt-4',
106
+ 'offsetgroup': 'gpt-4',
107
+ 'orientation': 'v',
108
+ 'showlegend': True,
109
+ 'textposition': 'auto',
110
+ 'type': 'bar',
111
+ 'x': array(['gpt-4'], dtype=object),
112
+ 'xaxis': 'x',
113
+ 'y': array([15.52184566]),
114
+ 'yaxis': 'y'},
115
+ {'alignmentgroup': 'True',
116
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
117
+ 'legendgroup': 'gpt-4-turbo',
118
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
119
+ 'name': 'gpt-4-turbo',
120
+ 'offsetgroup': 'gpt-4-turbo',
121
+ 'orientation': 'v',
122
+ 'showlegend': True,
123
+ 'textposition': 'auto',
124
+ 'type': 'bar',
125
+ 'x': array(['gpt-4-turbo'], dtype=object),
126
+ 'xaxis': 'x',
127
+ 'y': array([14.00852903]),
128
+ 'yaxis': 'y'},
129
+ {'alignmentgroup': 'True',
130
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
131
+ 'legendgroup': 'llama-2-70b-chat',
132
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
133
+ 'name': 'llama-2-70b-chat',
134
+ 'offsetgroup': 'llama-2-70b-chat',
135
+ 'orientation': 'v',
136
+ 'showlegend': True,
137
+ 'textposition': 'auto',
138
+ 'type': 'bar',
139
+ 'x': array(['llama-2-70b-chat'], dtype=object),
140
+ 'xaxis': 'x',
141
+ 'y': array([6.0658799]),
142
+ 'yaxis': 'y'},
143
+ {'alignmentgroup': 'True',
144
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
145
+ 'legendgroup': 'zephyr-7b-beta',
146
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
147
+ 'name': 'zephyr-7b-beta',
148
+ 'offsetgroup': 'zephyr-7b-beta',
149
+ 'orientation': 'v',
150
+ 'showlegend': True,
151
+ 'textposition': 'auto',
152
+ 'type': 'bar',
153
+ 'x': array(['zephyr-7b-beta'], dtype=object),
154
+ 'xaxis': 'x',
155
+ 'y': array([3.23879932]),
156
+ 'yaxis': 'y'}],
157
+ 'layout': {'barmode': 'relative',
158
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
159
+ 'template': '...',
160
+ 'title': {'text': 'Model endpoints response times'},
161
+ 'xaxis': {'anchor': 'y',
162
+ 'categoryarray': [Mistral-7B-Instruct-v0.2,
163
+ Mixtral-8x7B-Instruct-v0.1,
164
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
165
+ chat-bison, chat-bison-32k, gemini-pro,
166
+ gpt-3.5-turbo, gpt-4, gpt-4-turbo,
167
+ llama-2-70b-chat, zephyr-7b-beta],
168
+ 'categoryorder': 'array',
169
+ 'domain': [0.0, 1.0],
170
+ 'title': {'text': 'Model'}},
171
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution time (s)'}}}
172
+ })",Model endpoints response times,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[3.174540030956268],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[7.142197625471814],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.2902645373344421],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[3.890243631601334],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[4.128177767992019],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[4.72138064004937],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[5.282373493889353],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[15.5218456586202],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[14.008529031276703],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[6.06587989590749],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[3.2387993240356447],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3
786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidi
ty"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ti
cks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line""
:{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison"",""chat-bison-32k"",""gemini-pro"",""gpt-3.5-turbo"",""gpt-4"",""gpt-4-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution time (s)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model endpoints response times""},""barmode"":""relative""}}"
173
+ ./html/plots/execution_costs.html,"Figure({
174
+ 'data': [{'alignmentgroup': 'True',
175
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
176
+ 'legendgroup': 'gpt-3.5-turbo',
177
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
178
+ 'name': 'gpt-3.5-turbo',
179
+ 'offsetgroup': 'gpt-3.5-turbo',
180
+ 'orientation': 'v',
181
+ 'showlegend': True,
182
+ 'textposition': 'auto',
183
+ 'type': 'bar',
184
+ 'x': array(['gpt-3.5-turbo', 'gpt-3.5-turbo'], dtype=object),
185
+ 'xaxis': 'x',
186
+ 'y': array([0.144438, 0.144438]),
187
+ 'yaxis': 'y'},
188
+ {'alignmentgroup': 'True',
189
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
190
+ 'legendgroup': 'gpt-4-turbo',
191
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
192
+ 'name': 'gpt-4-turbo',
193
+ 'offsetgroup': 'gpt-4-turbo',
194
+ 'orientation': 'v',
195
+ 'showlegend': True,
196
+ 'textposition': 'auto',
197
+ 'type': 'bar',
198
+ 'x': array(['gpt-4-turbo'], dtype=object),
199
+ 'xaxis': 'x',
200
+ 'y': array([0.44014]),
201
+ 'yaxis': 'y'},
202
+ {'alignmentgroup': 'True',
203
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
204
+ 'legendgroup': 'gpt-4',
205
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
206
+ 'name': 'gpt-4',
207
+ 'offsetgroup': 'gpt-4',
208
+ 'orientation': 'v',
209
+ 'showlegend': True,
210
+ 'textposition': 'auto',
211
+ 'type': 'bar',
212
+ 'x': array(['gpt-4'], dtype=object),
213
+ 'xaxis': 'x',
214
+ 'y': array([1.1724]),
215
+ 'yaxis': 'y'},
216
+ {'alignmentgroup': 'True',
217
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
218
+ 'legendgroup': 'llama-2-70b-chat',
219
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
220
+ 'name': 'llama-2-70b-chat',
221
+ 'offsetgroup': 'llama-2-70b-chat',
222
+ 'orientation': 'v',
223
+ 'showlegend': True,
224
+ 'textposition': 'auto',
225
+ 'type': 'bar',
226
+ 'x': array(['llama-2-70b-chat'], dtype=object),
227
+ 'xaxis': 'x',
228
+ 'y': array([0.0186864]),
229
+ 'yaxis': 'y'},
230
+ {'alignmentgroup': 'True',
231
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
232
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
233
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
234
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
235
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
236
+ 'orientation': 'v',
237
+ 'showlegend': True,
238
+ 'textposition': 'auto',
239
+ 'type': 'bar',
240
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
241
+ 'xaxis': 'x',
242
+ 'y': array([0.0781551]),
243
+ 'yaxis': 'y'},
244
+ {'alignmentgroup': 'True',
245
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
246
+ 'legendgroup': 'zephyr-7b-beta',
247
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
248
+ 'name': 'zephyr-7b-beta',
249
+ 'offsetgroup': 'zephyr-7b-beta',
250
+ 'orientation': 'v',
251
+ 'showlegend': True,
252
+ 'textposition': 'auto',
253
+ 'type': 'bar',
254
+ 'x': array(['zephyr-7b-beta'], dtype=object),
255
+ 'xaxis': 'x',
256
+ 'y': array([0.09836233]),
257
+ 'yaxis': 'y'},
258
+ {'alignmentgroup': 'True',
259
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
260
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
261
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
262
+ 'name': 'Mistral-7B-Instruct-v0.2',
263
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
264
+ 'orientation': 'v',
265
+ 'showlegend': True,
266
+ 'textposition': 'auto',
267
+ 'type': 'bar',
268
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
269
+ 'xaxis': 'x',
270
+ 'y': array([0.09813028]),
271
+ 'yaxis': 'y'},
272
+ {'alignmentgroup': 'True',
273
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
274
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
275
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
276
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
277
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
278
+ 'orientation': 'v',
279
+ 'showlegend': True,
280
+ 'textposition': 'auto',
281
+ 'type': 'bar',
282
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
283
+ 'xaxis': 'x',
284
+ 'y': array([0.04215044]),
285
+ 'yaxis': 'y'},
286
+ {'alignmentgroup': 'True',
287
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
288
+ 'legendgroup': 'gemini-pro',
289
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
290
+ 'name': 'gemini-pro',
291
+ 'offsetgroup': 'gemini-pro',
292
+ 'orientation': 'v',
293
+ 'showlegend': True,
294
+ 'textposition': 'auto',
295
+ 'type': 'bar',
296
+ 'x': array(['gemini-pro'], dtype=object),
297
+ 'xaxis': 'x',
298
+ 'y': array([0.022971]),
299
+ 'yaxis': 'y'},
300
+ {'alignmentgroup': 'True',
301
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
302
+ 'legendgroup': 'chat-bison (PaLM 2)',
303
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
304
+ 'name': 'chat-bison (PaLM 2)',
305
+ 'offsetgroup': 'chat-bison (PaLM 2)',
306
+ 'orientation': 'v',
307
+ 'showlegend': True,
308
+ 'textposition': 'auto',
309
+ 'type': 'bar',
310
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
311
+ 'xaxis': 'x',
312
+ 'y': array([0.]),
313
+ 'yaxis': 'y'},
314
+ {'alignmentgroup': 'True',
315
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
316
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
317
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
318
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
319
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
320
+ 'orientation': 'v',
321
+ 'showlegend': True,
322
+ 'textposition': 'auto',
323
+ 'type': 'bar',
324
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
325
+ 'xaxis': 'x',
326
+ 'y': array([0.]),
327
+ 'yaxis': 'y'}],
328
+ 'layout': {'barmode': 'relative',
329
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
330
+ 'template': '...',
331
+ 'title': {'text': 'Costs of execution of 200 test queries per model'},
332
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
333
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}}}
334
+ })",Costs of execution of 200 test queries per model,Note that some providers bill by token count and some by execution time. In the second case we used averaged pausing and resuming time to calculate the cost and assumed that all queries have been done in one session. Also note that for now the Gemini-Pro model is free for under 60 queries per minute.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo"",""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[0.144438,0.144438],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[0.44014],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[1.1724],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[0.0186864],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[0.07815509999999999],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[0.09836233089235094],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[0.09813028344511986],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[0.042150440895557396],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[0.022971],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 
32K)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlin
ewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapb
ox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2
222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},
""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 200 test queries per model""},""barmode"":""relative""}}"
335
+ ./html/plots/model_sizes.html,"Figure({
336
+ 'data': [{'alignmentgroup': 'True',
337
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
338
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
339
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
340
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
341
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
342
+ 'orientation': 'v',
343
+ 'showlegend': True,
344
+ 'textposition': 'auto',
345
+ 'type': 'bar',
346
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
347
+ 'xaxis': 'x',
348
+ 'y': array([56.]),
349
+ 'yaxis': 'y'},
350
+ {'alignmentgroup': 'True',
351
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
352
+ 'legendgroup': 'zephyr-7b-beta',
353
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
354
+ 'name': 'zephyr-7b-beta',
355
+ 'offsetgroup': 'zephyr-7b-beta',
356
+ 'orientation': 'v',
357
+ 'showlegend': True,
358
+ 'textposition': 'auto',
359
+ 'type': 'bar',
360
+ 'x': array(['zephyr-7b-beta'], dtype=object),
361
+ 'xaxis': 'x',
362
+ 'y': array([7.]),
363
+ 'yaxis': 'y'},
364
+ {'alignmentgroup': 'True',
365
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
366
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
367
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
368
+ 'name': 'Mistral-7B-Instruct-v0.2',
369
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
370
+ 'orientation': 'v',
371
+ 'showlegend': True,
372
+ 'textposition': 'auto',
373
+ 'type': 'bar',
374
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
375
+ 'xaxis': 'x',
376
+ 'y': array([7.]),
377
+ 'yaxis': 'y'},
378
+ {'alignmentgroup': 'True',
379
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
380
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
381
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
382
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
383
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
384
+ 'orientation': 'v',
385
+ 'showlegend': True,
386
+ 'textposition': 'auto',
387
+ 'type': 'bar',
388
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
389
+ 'xaxis': 'x',
390
+ 'y': array([1.1]),
391
+ 'yaxis': 'y'}],
392
+ 'layout': {'barmode': 'relative',
393
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
394
+ 'template': '...',
395
+ 'title': {'text': 'Model sizes in billions of parameters'},
396
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
397
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}}}
398
+ })",Model sizes in billions of parameters,Note that some models have undisclosed sizes.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B 
params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.1],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.
2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}
}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary""
:{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true
,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"
data/2024-01-26 11:04:35.555342_general_plot.csv ADDED
@@ -0,0 +1,398 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ path,plot_object,description,comment,plot_json
2
+ ./html/plots/response_times.html,"Figure({
3
+ 'data': [{'alignmentgroup': 'True',
4
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
5
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
6
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
7
+ 'name': 'Mistral-7B-Instruct-v0.2',
8
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
9
+ 'orientation': 'v',
10
+ 'showlegend': True,
11
+ 'textposition': 'auto',
12
+ 'type': 'bar',
13
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
+ 'xaxis': 'x',
15
+ 'y': array([3.17454003]),
16
+ 'yaxis': 'y'},
17
+ {'alignmentgroup': 'True',
18
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
19
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
20
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
21
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
22
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
23
+ 'orientation': 'v',
24
+ 'showlegend': True,
25
+ 'textposition': 'auto',
26
+ 'type': 'bar',
27
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
+ 'xaxis': 'x',
29
+ 'y': array([7.14219763]),
30
+ 'yaxis': 'y'},
31
+ {'alignmentgroup': 'True',
32
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
33
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
34
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
35
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
36
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
37
+ 'orientation': 'v',
38
+ 'showlegend': True,
39
+ 'textposition': 'auto',
40
+ 'type': 'bar',
41
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
+ 'xaxis': 'x',
43
+ 'y': array([1.29026454]),
44
+ 'yaxis': 'y'},
45
+ {'alignmentgroup': 'True',
46
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
47
+ 'legendgroup': 'chat-bison',
48
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
+ 'name': 'chat-bison',
50
+ 'offsetgroup': 'chat-bison',
51
+ 'orientation': 'v',
52
+ 'showlegend': True,
53
+ 'textposition': 'auto',
54
+ 'type': 'bar',
55
+ 'x': array(['chat-bison'], dtype=object),
56
+ 'xaxis': 'x',
57
+ 'y': array([3.89024363]),
58
+ 'yaxis': 'y'},
59
+ {'alignmentgroup': 'True',
60
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
61
+ 'legendgroup': 'chat-bison-32k',
62
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
+ 'name': 'chat-bison-32k',
64
+ 'offsetgroup': 'chat-bison-32k',
65
+ 'orientation': 'v',
66
+ 'showlegend': True,
67
+ 'textposition': 'auto',
68
+ 'type': 'bar',
69
+ 'x': array(['chat-bison-32k'], dtype=object),
70
+ 'xaxis': 'x',
71
+ 'y': array([4.12817777]),
72
+ 'yaxis': 'y'},
73
+ {'alignmentgroup': 'True',
74
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
75
+ 'legendgroup': 'gemini-pro',
76
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
+ 'name': 'gemini-pro',
78
+ 'offsetgroup': 'gemini-pro',
79
+ 'orientation': 'v',
80
+ 'showlegend': True,
81
+ 'textposition': 'auto',
82
+ 'type': 'bar',
83
+ 'x': array(['gemini-pro'], dtype=object),
84
+ 'xaxis': 'x',
85
+ 'y': array([4.72138064]),
86
+ 'yaxis': 'y'},
87
+ {'alignmentgroup': 'True',
88
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
89
+ 'legendgroup': 'gpt-3.5-turbo',
90
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
+ 'name': 'gpt-3.5-turbo',
92
+ 'offsetgroup': 'gpt-3.5-turbo',
93
+ 'orientation': 'v',
94
+ 'showlegend': True,
95
+ 'textposition': 'auto',
96
+ 'type': 'bar',
97
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
98
+ 'xaxis': 'x',
99
+ 'y': array([5.28237349]),
100
+ 'yaxis': 'y'},
101
+ {'alignmentgroup': 'True',
102
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
103
+ 'legendgroup': 'gpt-4',
104
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
105
+ 'name': 'gpt-4',
106
+ 'offsetgroup': 'gpt-4',
107
+ 'orientation': 'v',
108
+ 'showlegend': True,
109
+ 'textposition': 'auto',
110
+ 'type': 'bar',
111
+ 'x': array(['gpt-4'], dtype=object),
112
+ 'xaxis': 'x',
113
+ 'y': array([15.52184566]),
114
+ 'yaxis': 'y'},
115
+ {'alignmentgroup': 'True',
116
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
117
+ 'legendgroup': 'gpt-4-turbo',
118
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
119
+ 'name': 'gpt-4-turbo',
120
+ 'offsetgroup': 'gpt-4-turbo',
121
+ 'orientation': 'v',
122
+ 'showlegend': True,
123
+ 'textposition': 'auto',
124
+ 'type': 'bar',
125
+ 'x': array(['gpt-4-turbo'], dtype=object),
126
+ 'xaxis': 'x',
127
+ 'y': array([14.00852903]),
128
+ 'yaxis': 'y'},
129
+ {'alignmentgroup': 'True',
130
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
131
+ 'legendgroup': 'llama-2-70b-chat',
132
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
133
+ 'name': 'llama-2-70b-chat',
134
+ 'offsetgroup': 'llama-2-70b-chat',
135
+ 'orientation': 'v',
136
+ 'showlegend': True,
137
+ 'textposition': 'auto',
138
+ 'type': 'bar',
139
+ 'x': array(['llama-2-70b-chat'], dtype=object),
140
+ 'xaxis': 'x',
141
+ 'y': array([6.0658799]),
142
+ 'yaxis': 'y'},
143
+ {'alignmentgroup': 'True',
144
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
145
+ 'legendgroup': 'zephyr-7b-beta',
146
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
147
+ 'name': 'zephyr-7b-beta',
148
+ 'offsetgroup': 'zephyr-7b-beta',
149
+ 'orientation': 'v',
150
+ 'showlegend': True,
151
+ 'textposition': 'auto',
152
+ 'type': 'bar',
153
+ 'x': array(['zephyr-7b-beta'], dtype=object),
154
+ 'xaxis': 'x',
155
+ 'y': array([3.23879932]),
156
+ 'yaxis': 'y'}],
157
+ 'layout': {'barmode': 'relative',
158
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
159
+ 'template': '...',
160
+ 'title': {'text': 'Model endpoints response times'},
161
+ 'xaxis': {'anchor': 'y',
162
+ 'categoryarray': [Mistral-7B-Instruct-v0.2,
163
+ Mixtral-8x7B-Instruct-v0.1,
164
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
165
+ chat-bison, chat-bison-32k, gemini-pro,
166
+ gpt-3.5-turbo, gpt-4, gpt-4-turbo,
167
+ llama-2-70b-chat, zephyr-7b-beta],
168
+ 'categoryorder': 'array',
169
+ 'domain': [0.0, 1.0],
170
+ 'title': {'text': 'Model'}},
171
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution time (s)'}}}
172
+ })",Model endpoints response times,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[3.174540030956268],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[7.142197625471814],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.2902645373344421],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[3.890243631601334],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[4.128177767992019],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[4.72138064004937],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[5.282373493889353],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[15.5218456586202],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[14.008529031276703],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[6.06587989590749],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[3.2387993240356447],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3
786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidi
ty"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ti
cks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line""
:{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison"",""chat-bison-32k"",""gemini-pro"",""gpt-3.5-turbo"",""gpt-4"",""gpt-4-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution time (s)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model endpoints response times""},""barmode"":""relative""}}"
173
+ ./html/plots/execution_costs.html,"Figure({
174
+ 'data': [{'alignmentgroup': 'True',
175
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
176
+ 'legendgroup': 'gpt-3.5-turbo',
177
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
178
+ 'name': 'gpt-3.5-turbo',
179
+ 'offsetgroup': 'gpt-3.5-turbo',
180
+ 'orientation': 'v',
181
+ 'showlegend': True,
182
+ 'textposition': 'auto',
183
+ 'type': 'bar',
184
+ 'x': array(['gpt-3.5-turbo', 'gpt-3.5-turbo'], dtype=object),
185
+ 'xaxis': 'x',
186
+ 'y': array([0.002434, 0.002434]),
187
+ 'yaxis': 'y'},
188
+ {'alignmentgroup': 'True',
189
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
190
+ 'legendgroup': 'gpt-4-turbo',
191
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
192
+ 'name': 'gpt-4-turbo',
193
+ 'offsetgroup': 'gpt-4-turbo',
194
+ 'orientation': 'v',
195
+ 'showlegend': True,
196
+ 'textposition': 'auto',
197
+ 'type': 'bar',
198
+ 'x': array(['gpt-4-turbo'], dtype=object),
199
+ 'xaxis': 'x',
200
+ 'y': array([0.02967]),
201
+ 'yaxis': 'y'},
202
+ {'alignmentgroup': 'True',
203
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
204
+ 'legendgroup': 'gpt-4',
205
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
206
+ 'name': 'gpt-4',
207
+ 'offsetgroup': 'gpt-4',
208
+ 'orientation': 'v',
209
+ 'showlegend': True,
210
+ 'textposition': 'auto',
211
+ 'type': 'bar',
212
+ 'x': array(['gpt-4'], dtype=object),
213
+ 'xaxis': 'x',
214
+ 'y': array([0.07839]),
215
+ 'yaxis': 'y'},
216
+ {'alignmentgroup': 'True',
217
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
218
+ 'legendgroup': 'llama-2-70b-chat',
219
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
220
+ 'name': 'llama-2-70b-chat',
221
+ 'offsetgroup': 'llama-2-70b-chat',
222
+ 'orientation': 'v',
223
+ 'showlegend': True,
224
+ 'textposition': 'auto',
225
+ 'type': 'bar',
226
+ 'x': array(['llama-2-70b-chat'], dtype=object),
227
+ 'xaxis': 'x',
228
+ 'y': array([0.0011922]),
229
+ 'yaxis': 'y'},
230
+ {'alignmentgroup': 'True',
231
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
232
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
233
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
234
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
235
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
236
+ 'orientation': 'v',
237
+ 'showlegend': True,
238
+ 'textposition': 'auto',
239
+ 'type': 'bar',
240
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
241
+ 'xaxis': 'x',
242
+ 'y': array([0.0021672]),
243
+ 'yaxis': 'y'},
244
+ {'alignmentgroup': 'True',
245
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
246
+ 'legendgroup': 'zephyr-7b-beta',
247
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
248
+ 'name': 'zephyr-7b-beta',
249
+ 'offsetgroup': 'zephyr-7b-beta',
250
+ 'orientation': 'v',
251
+ 'showlegend': True,
252
+ 'textposition': 'auto',
253
+ 'type': 'bar',
254
+ 'x': array(['zephyr-7b-beta'], dtype=object),
255
+ 'xaxis': 'x',
256
+ 'y': array([0.08803055]),
257
+ 'yaxis': 'y'},
258
+ {'alignmentgroup': 'True',
259
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
260
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
261
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
262
+ 'name': 'Mistral-7B-Instruct-v0.2',
263
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
264
+ 'orientation': 'v',
265
+ 'showlegend': True,
266
+ 'textposition': 'auto',
267
+ 'type': 'bar',
268
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
269
+ 'xaxis': 'x',
270
+ 'y': array([0.08803149]),
271
+ 'yaxis': 'y'},
272
+ {'alignmentgroup': 'True',
273
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
274
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
275
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
276
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
277
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
278
+ 'orientation': 'v',
279
+ 'showlegend': True,
280
+ 'textposition': 'auto',
281
+ 'type': 'bar',
282
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
283
+ 'xaxis': 'x',
284
+ 'y': array([0.04039957]),
285
+ 'yaxis': 'y'},
286
+ {'alignmentgroup': 'True',
287
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
288
+ 'legendgroup': 'gemini-pro',
289
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
290
+ 'name': 'gemini-pro',
291
+ 'offsetgroup': 'gemini-pro',
292
+ 'orientation': 'v',
293
+ 'showlegend': True,
294
+ 'textposition': 'auto',
295
+ 'type': 'bar',
296
+ 'x': array(['gemini-pro'], dtype=object),
297
+ 'xaxis': 'x',
298
+ 'y': array([0.000651]),
299
+ 'yaxis': 'y'},
300
+ {'alignmentgroup': 'True',
301
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
302
+ 'legendgroup': 'chat-bison (PaLM 2)',
303
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
304
+ 'name': 'chat-bison (PaLM 2)',
305
+ 'offsetgroup': 'chat-bison (PaLM 2)',
306
+ 'orientation': 'v',
307
+ 'showlegend': True,
308
+ 'textposition': 'auto',
309
+ 'type': 'bar',
310
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
311
+ 'xaxis': 'x',
312
+ 'y': array([0.]),
313
+ 'yaxis': 'y'},
314
+ {'alignmentgroup': 'True',
315
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
316
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
317
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
318
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
319
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
320
+ 'orientation': 'v',
321
+ 'showlegend': True,
322
+ 'textposition': 'auto',
323
+ 'type': 'bar',
324
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
325
+ 'xaxis': 'x',
326
+ 'y': array([0.]),
327
+ 'yaxis': 'y'}],
328
+ 'layout': {'barmode': 'relative',
329
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
330
+ 'template': '...',
331
+ 'title': {'text': 'Costs of execution of 39 test queries per model'},
332
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
333
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}}}
334
+ })",Costs of execution of 39 test queries per model,Note that some providers bill by token count and some by execution time. In the second case we used averaged pausing and resuming time to calculate the cost and assumed that all queries have been done in one session. Also note that for now the Gemini-Pro model is free for under 60 queries per minute.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo"",""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[0.002434,0.002434],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[0.029670000000000002],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[0.07839],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[0.0011922],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[0.0021672],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[0.08803054547641014],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[0.08803148682845963],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[0.040399565458297725],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[0.000651],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 
32K)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlin
ewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapb
ox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2
222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},
""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 39 test queries per model""},""barmode"":""relative""}}"
335
+ ./html/plots/model_sizes.html,"Figure({
336
+ 'data': [{'alignmentgroup': 'True',
337
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
338
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
339
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
340
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
341
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
342
+ 'orientation': 'v',
343
+ 'showlegend': True,
344
+ 'textposition': 'auto',
345
+ 'type': 'bar',
346
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
347
+ 'xaxis': 'x',
348
+ 'y': array([56.]),
349
+ 'yaxis': 'y'},
350
+ {'alignmentgroup': 'True',
351
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
352
+ 'legendgroup': 'zephyr-7b-beta',
353
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
354
+ 'name': 'zephyr-7b-beta',
355
+ 'offsetgroup': 'zephyr-7b-beta',
356
+ 'orientation': 'v',
357
+ 'showlegend': True,
358
+ 'textposition': 'auto',
359
+ 'type': 'bar',
360
+ 'x': array(['zephyr-7b-beta'], dtype=object),
361
+ 'xaxis': 'x',
362
+ 'y': array([7.]),
363
+ 'yaxis': 'y'},
364
+ {'alignmentgroup': 'True',
365
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
366
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
367
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
368
+ 'name': 'Mistral-7B-Instruct-v0.2',
369
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
370
+ 'orientation': 'v',
371
+ 'showlegend': True,
372
+ 'textposition': 'auto',
373
+ 'type': 'bar',
374
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
375
+ 'xaxis': 'x',
376
+ 'y': array([7.]),
377
+ 'yaxis': 'y'},
378
+ {'alignmentgroup': 'True',
379
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
380
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
381
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
382
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
383
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
384
+ 'orientation': 'v',
385
+ 'showlegend': True,
386
+ 'textposition': 'auto',
387
+ 'type': 'bar',
388
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
389
+ 'xaxis': 'x',
390
+ 'y': array([1.1]),
391
+ 'yaxis': 'y'}],
392
+ 'layout': {'barmode': 'relative',
393
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
394
+ 'template': '...',
395
+ 'title': {'text': 'Model sizes in billions of parameters'},
396
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
397
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}}}
398
+ })",Model sizes in billions of parameters,Note that some models have undisclosed sizes.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B 
params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.1],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.
2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}
}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary""
:{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true
,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"
data/2024-01-26 11:06:20.415218_general_plot.csv ADDED
@@ -0,0 +1,398 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ path,plot_object,description,comment,plot_json
2
+ ./html/plots/response_times.html,"Figure({
3
+ 'data': [{'alignmentgroup': 'True',
4
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
5
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
6
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
7
+ 'name': 'Mistral-7B-Instruct-v0.2',
8
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
9
+ 'orientation': 'v',
10
+ 'showlegend': True,
11
+ 'textposition': 'auto',
12
+ 'type': 'bar',
13
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
+ 'xaxis': 'x',
15
+ 'y': array([3.17454003]),
16
+ 'yaxis': 'y'},
17
+ {'alignmentgroup': 'True',
18
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
19
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
20
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
21
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
22
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
23
+ 'orientation': 'v',
24
+ 'showlegend': True,
25
+ 'textposition': 'auto',
26
+ 'type': 'bar',
27
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
+ 'xaxis': 'x',
29
+ 'y': array([7.14219763]),
30
+ 'yaxis': 'y'},
31
+ {'alignmentgroup': 'True',
32
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
33
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
34
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
35
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
36
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
37
+ 'orientation': 'v',
38
+ 'showlegend': True,
39
+ 'textposition': 'auto',
40
+ 'type': 'bar',
41
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
+ 'xaxis': 'x',
43
+ 'y': array([1.29026454]),
44
+ 'yaxis': 'y'},
45
+ {'alignmentgroup': 'True',
46
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
47
+ 'legendgroup': 'chat-bison',
48
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
+ 'name': 'chat-bison',
50
+ 'offsetgroup': 'chat-bison',
51
+ 'orientation': 'v',
52
+ 'showlegend': True,
53
+ 'textposition': 'auto',
54
+ 'type': 'bar',
55
+ 'x': array(['chat-bison'], dtype=object),
56
+ 'xaxis': 'x',
57
+ 'y': array([3.89024363]),
58
+ 'yaxis': 'y'},
59
+ {'alignmentgroup': 'True',
60
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
61
+ 'legendgroup': 'chat-bison-32k',
62
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
+ 'name': 'chat-bison-32k',
64
+ 'offsetgroup': 'chat-bison-32k',
65
+ 'orientation': 'v',
66
+ 'showlegend': True,
67
+ 'textposition': 'auto',
68
+ 'type': 'bar',
69
+ 'x': array(['chat-bison-32k'], dtype=object),
70
+ 'xaxis': 'x',
71
+ 'y': array([4.12817777]),
72
+ 'yaxis': 'y'},
73
+ {'alignmentgroup': 'True',
74
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
75
+ 'legendgroup': 'gemini-pro',
76
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
+ 'name': 'gemini-pro',
78
+ 'offsetgroup': 'gemini-pro',
79
+ 'orientation': 'v',
80
+ 'showlegend': True,
81
+ 'textposition': 'auto',
82
+ 'type': 'bar',
83
+ 'x': array(['gemini-pro'], dtype=object),
84
+ 'xaxis': 'x',
85
+ 'y': array([4.72138064]),
86
+ 'yaxis': 'y'},
87
+ {'alignmentgroup': 'True',
88
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
89
+ 'legendgroup': 'gpt-3.5-turbo',
90
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
+ 'name': 'gpt-3.5-turbo',
92
+ 'offsetgroup': 'gpt-3.5-turbo',
93
+ 'orientation': 'v',
94
+ 'showlegend': True,
95
+ 'textposition': 'auto',
96
+ 'type': 'bar',
97
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
98
+ 'xaxis': 'x',
99
+ 'y': array([5.28237349]),
100
+ 'yaxis': 'y'},
101
+ {'alignmentgroup': 'True',
102
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
103
+ 'legendgroup': 'gpt-4',
104
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
105
+ 'name': 'gpt-4',
106
+ 'offsetgroup': 'gpt-4',
107
+ 'orientation': 'v',
108
+ 'showlegend': True,
109
+ 'textposition': 'auto',
110
+ 'type': 'bar',
111
+ 'x': array(['gpt-4'], dtype=object),
112
+ 'xaxis': 'x',
113
+ 'y': array([15.52184566]),
114
+ 'yaxis': 'y'},
115
+ {'alignmentgroup': 'True',
116
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
117
+ 'legendgroup': 'gpt-4-turbo',
118
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
119
+ 'name': 'gpt-4-turbo',
120
+ 'offsetgroup': 'gpt-4-turbo',
121
+ 'orientation': 'v',
122
+ 'showlegend': True,
123
+ 'textposition': 'auto',
124
+ 'type': 'bar',
125
+ 'x': array(['gpt-4-turbo'], dtype=object),
126
+ 'xaxis': 'x',
127
+ 'y': array([14.00852903]),
128
+ 'yaxis': 'y'},
129
+ {'alignmentgroup': 'True',
130
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
131
+ 'legendgroup': 'llama-2-70b-chat',
132
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
133
+ 'name': 'llama-2-70b-chat',
134
+ 'offsetgroup': 'llama-2-70b-chat',
135
+ 'orientation': 'v',
136
+ 'showlegend': True,
137
+ 'textposition': 'auto',
138
+ 'type': 'bar',
139
+ 'x': array(['llama-2-70b-chat'], dtype=object),
140
+ 'xaxis': 'x',
141
+ 'y': array([6.0658799]),
142
+ 'yaxis': 'y'},
143
+ {'alignmentgroup': 'True',
144
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
145
+ 'legendgroup': 'zephyr-7b-beta',
146
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
147
+ 'name': 'zephyr-7b-beta',
148
+ 'offsetgroup': 'zephyr-7b-beta',
149
+ 'orientation': 'v',
150
+ 'showlegend': True,
151
+ 'textposition': 'auto',
152
+ 'type': 'bar',
153
+ 'x': array(['zephyr-7b-beta'], dtype=object),
154
+ 'xaxis': 'x',
155
+ 'y': array([3.23879932]),
156
+ 'yaxis': 'y'}],
157
+ 'layout': {'barmode': 'relative',
158
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
159
+ 'template': '...',
160
+ 'title': {'text': 'Model endpoints response times'},
161
+ 'xaxis': {'anchor': 'y',
162
+ 'categoryarray': [Mistral-7B-Instruct-v0.2,
163
+ Mixtral-8x7B-Instruct-v0.1,
164
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
165
+ chat-bison, chat-bison-32k, gemini-pro,
166
+ gpt-3.5-turbo, gpt-4, gpt-4-turbo,
167
+ llama-2-70b-chat, zephyr-7b-beta],
168
+ 'categoryorder': 'array',
169
+ 'domain': [0.0, 1.0],
170
+ 'title': {'text': 'Model'}},
171
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution time (s)'}}}
172
+ })",Model endpoints response times,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[3.174540030956268],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[7.142197625471814],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.2902645373344421],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[3.890243631601334],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[4.128177767992019],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[4.72138064004937],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[5.282373493889353],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[15.5218456586202],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[14.008529031276703],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[6.06587989590749],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[3.2387993240356447],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3
786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidi
ty"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ti
cks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line""
:{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison"",""chat-bison-32k"",""gemini-pro"",""gpt-3.5-turbo"",""gpt-4"",""gpt-4-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution time (s)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model endpoints response times""},""barmode"":""relative""}}"
173
+ ./html/plots/execution_costs.html,"Figure({
174
+ 'data': [{'alignmentgroup': 'True',
175
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
176
+ 'legendgroup': 'gpt-3.5-turbo',
177
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
178
+ 'name': 'gpt-3.5-turbo',
179
+ 'offsetgroup': 'gpt-3.5-turbo',
180
+ 'orientation': 'v',
181
+ 'showlegend': True,
182
+ 'textposition': 'auto',
183
+ 'type': 'bar',
184
+ 'x': array(['gpt-3.5-turbo', 'gpt-3.5-turbo'], dtype=object),
185
+ 'xaxis': 'x',
186
+ 'y': array([0.020961, 0.020961]),
187
+ 'yaxis': 'y'},
188
+ {'alignmentgroup': 'True',
189
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
190
+ 'legendgroup': 'gpt-4-turbo',
191
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
192
+ 'name': 'gpt-4-turbo',
193
+ 'offsetgroup': 'gpt-4-turbo',
194
+ 'orientation': 'v',
195
+ 'showlegend': True,
196
+ 'textposition': 'auto',
197
+ 'type': 'bar',
198
+ 'x': array(['gpt-4-turbo'], dtype=object),
199
+ 'xaxis': 'x',
200
+ 'y': array([0.21067]),
201
+ 'yaxis': 'y'},
202
+ {'alignmentgroup': 'True',
203
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
204
+ 'legendgroup': 'gpt-4',
205
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
206
+ 'name': 'gpt-4',
207
+ 'offsetgroup': 'gpt-4',
208
+ 'orientation': 'v',
209
+ 'showlegend': True,
210
+ 'textposition': 'auto',
211
+ 'type': 'bar',
212
+ 'x': array(['gpt-4'], dtype=object),
213
+ 'xaxis': 'x',
214
+ 'y': array([0.5502]),
215
+ 'yaxis': 'y'},
216
+ {'alignmentgroup': 'True',
217
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
218
+ 'legendgroup': 'llama-2-70b-chat',
219
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
220
+ 'name': 'llama-2-70b-chat',
221
+ 'offsetgroup': 'llama-2-70b-chat',
222
+ 'orientation': 'v',
223
+ 'showlegend': True,
224
+ 'textposition': 'auto',
225
+ 'type': 'bar',
226
+ 'x': array(['llama-2-70b-chat'], dtype=object),
227
+ 'xaxis': 'x',
228
+ 'y': array([0.004106]),
229
+ 'yaxis': 'y'},
230
+ {'alignmentgroup': 'True',
231
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
232
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
233
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
234
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
235
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
236
+ 'orientation': 'v',
237
+ 'showlegend': True,
238
+ 'textposition': 'auto',
239
+ 'type': 'bar',
240
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
241
+ 'xaxis': 'x',
242
+ 'y': array([0.0171468]),
243
+ 'yaxis': 'y'},
244
+ {'alignmentgroup': 'True',
245
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
246
+ 'legendgroup': 'zephyr-7b-beta',
247
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
248
+ 'name': 'zephyr-7b-beta',
249
+ 'offsetgroup': 'zephyr-7b-beta',
250
+ 'orientation': 'v',
251
+ 'showlegend': True,
252
+ 'textposition': 'auto',
253
+ 'type': 'bar',
254
+ 'x': array(['zephyr-7b-beta'], dtype=object),
255
+ 'xaxis': 'x',
256
+ 'y': array([0.00641104]),
257
+ 'yaxis': 'y'},
258
+ {'alignmentgroup': 'True',
259
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
260
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
261
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
262
+ 'name': 'Mistral-7B-Instruct-v0.2',
263
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
264
+ 'orientation': 'v',
265
+ 'showlegend': True,
266
+ 'textposition': 'auto',
267
+ 'type': 'bar',
268
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
269
+ 'xaxis': 'x',
270
+ 'y': array([0.00295553]),
271
+ 'yaxis': 'y'},
272
+ {'alignmentgroup': 'True',
273
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
274
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
275
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
276
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
277
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
278
+ 'orientation': 'v',
279
+ 'showlegend': True,
280
+ 'textposition': 'auto',
281
+ 'type': 'bar',
282
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
283
+ 'xaxis': 'x',
284
+ 'y': array([0.00086983]),
285
+ 'yaxis': 'y'},
286
+ {'alignmentgroup': 'True',
287
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
288
+ 'legendgroup': 'gemini-pro',
289
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
290
+ 'name': 'gemini-pro',
291
+ 'offsetgroup': 'gemini-pro',
292
+ 'orientation': 'v',
293
+ 'showlegend': True,
294
+ 'textposition': 'auto',
295
+ 'type': 'bar',
296
+ 'x': array(['gemini-pro'], dtype=object),
297
+ 'xaxis': 'x',
298
+ 'y': array([0.00511725]),
299
+ 'yaxis': 'y'},
300
+ {'alignmentgroup': 'True',
301
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
302
+ 'legendgroup': 'chat-bison (PaLM 2)',
303
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
304
+ 'name': 'chat-bison (PaLM 2)',
305
+ 'offsetgroup': 'chat-bison (PaLM 2)',
306
+ 'orientation': 'v',
307
+ 'showlegend': True,
308
+ 'textposition': 'auto',
309
+ 'type': 'bar',
310
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
311
+ 'xaxis': 'x',
312
+ 'y': array([0.]),
313
+ 'yaxis': 'y'},
314
+ {'alignmentgroup': 'True',
315
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
316
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
317
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
318
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
319
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
320
+ 'orientation': 'v',
321
+ 'showlegend': True,
322
+ 'textposition': 'auto',
323
+ 'type': 'bar',
324
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
325
+ 'xaxis': 'x',
326
+ 'y': array([0.]),
327
+ 'yaxis': 'y'}],
328
+ 'layout': {'barmode': 'relative',
329
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
330
+ 'template': '...',
331
+ 'title': {'text': 'Costs of execution of 39 test queries per model'},
332
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
333
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}}}
334
+ })",Costs of execution of 39 test queries per model,Note that some providers bill by token count and some by execution time. In the second case we used averaged pausing and resuming time to calculate the cost and assumed that all queries have been done in one session. Also note that for now the Gemini-Pro model is free for under 60 queries per minute.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo"",""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[0.020961,0.020961],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[0.21067],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[0.5502],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[0.004106],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[0.0171468],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[0.006411035042338901],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[0.002955533709128698],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[0.0008698255022366842],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[0.00511725],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 
32K)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlin
ewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapb
ox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2
222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},
""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 39 test queries per model""},""barmode"":""relative""}}"
335
+ ./html/plots/model_sizes.html,"Figure({
336
+ 'data': [{'alignmentgroup': 'True',
337
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
338
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
339
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
340
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
341
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
342
+ 'orientation': 'v',
343
+ 'showlegend': True,
344
+ 'textposition': 'auto',
345
+ 'type': 'bar',
346
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
347
+ 'xaxis': 'x',
348
+ 'y': array([56.]),
349
+ 'yaxis': 'y'},
350
+ {'alignmentgroup': 'True',
351
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
352
+ 'legendgroup': 'zephyr-7b-beta',
353
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
354
+ 'name': 'zephyr-7b-beta',
355
+ 'offsetgroup': 'zephyr-7b-beta',
356
+ 'orientation': 'v',
357
+ 'showlegend': True,
358
+ 'textposition': 'auto',
359
+ 'type': 'bar',
360
+ 'x': array(['zephyr-7b-beta'], dtype=object),
361
+ 'xaxis': 'x',
362
+ 'y': array([7.]),
363
+ 'yaxis': 'y'},
364
+ {'alignmentgroup': 'True',
365
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
366
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
367
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
368
+ 'name': 'Mistral-7B-Instruct-v0.2',
369
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
370
+ 'orientation': 'v',
371
+ 'showlegend': True,
372
+ 'textposition': 'auto',
373
+ 'type': 'bar',
374
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
375
+ 'xaxis': 'x',
376
+ 'y': array([7.]),
377
+ 'yaxis': 'y'},
378
+ {'alignmentgroup': 'True',
379
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
380
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
381
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
382
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
383
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
384
+ 'orientation': 'v',
385
+ 'showlegend': True,
386
+ 'textposition': 'auto',
387
+ 'type': 'bar',
388
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
389
+ 'xaxis': 'x',
390
+ 'y': array([1.1]),
391
+ 'yaxis': 'y'}],
392
+ 'layout': {'barmode': 'relative',
393
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
394
+ 'template': '...',
395
+ 'title': {'text': 'Model sizes in billions of parameters'},
396
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
397
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}}}
398
+ })",Model sizes in billions of parameters,Note that some models have undisclosed sizes.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B 
params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.1],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.
2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}
}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary""
:{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true
,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"
data/2024-01-26 11:19:58.683853_general_plot.csv ADDED
@@ -0,0 +1,398 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ path,plot_object,description,comment,plot_json
2
+ ./html/plots/response_times.html,"Figure({
3
+ 'data': [{'alignmentgroup': 'True',
4
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
5
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
6
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
7
+ 'name': 'Mistral-7B-Instruct-v0.2',
8
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
9
+ 'orientation': 'v',
10
+ 'showlegend': True,
11
+ 'textposition': 'auto',
12
+ 'type': 'bar',
13
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
+ 'xaxis': 'x',
15
+ 'y': array([3.17454003]),
16
+ 'yaxis': 'y'},
17
+ {'alignmentgroup': 'True',
18
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
19
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
20
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
21
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
22
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
23
+ 'orientation': 'v',
24
+ 'showlegend': True,
25
+ 'textposition': 'auto',
26
+ 'type': 'bar',
27
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
+ 'xaxis': 'x',
29
+ 'y': array([7.14219763]),
30
+ 'yaxis': 'y'},
31
+ {'alignmentgroup': 'True',
32
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
33
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
34
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
35
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
36
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
37
+ 'orientation': 'v',
38
+ 'showlegend': True,
39
+ 'textposition': 'auto',
40
+ 'type': 'bar',
41
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
+ 'xaxis': 'x',
43
+ 'y': array([1.29026454]),
44
+ 'yaxis': 'y'},
45
+ {'alignmentgroup': 'True',
46
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
47
+ 'legendgroup': 'chat-bison',
48
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
+ 'name': 'chat-bison',
50
+ 'offsetgroup': 'chat-bison',
51
+ 'orientation': 'v',
52
+ 'showlegend': True,
53
+ 'textposition': 'auto',
54
+ 'type': 'bar',
55
+ 'x': array(['chat-bison'], dtype=object),
56
+ 'xaxis': 'x',
57
+ 'y': array([3.89024363]),
58
+ 'yaxis': 'y'},
59
+ {'alignmentgroup': 'True',
60
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
61
+ 'legendgroup': 'chat-bison-32k',
62
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
+ 'name': 'chat-bison-32k',
64
+ 'offsetgroup': 'chat-bison-32k',
65
+ 'orientation': 'v',
66
+ 'showlegend': True,
67
+ 'textposition': 'auto',
68
+ 'type': 'bar',
69
+ 'x': array(['chat-bison-32k'], dtype=object),
70
+ 'xaxis': 'x',
71
+ 'y': array([4.12817777]),
72
+ 'yaxis': 'y'},
73
+ {'alignmentgroup': 'True',
74
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
75
+ 'legendgroup': 'gemini-pro',
76
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
+ 'name': 'gemini-pro',
78
+ 'offsetgroup': 'gemini-pro',
79
+ 'orientation': 'v',
80
+ 'showlegend': True,
81
+ 'textposition': 'auto',
82
+ 'type': 'bar',
83
+ 'x': array(['gemini-pro'], dtype=object),
84
+ 'xaxis': 'x',
85
+ 'y': array([4.72138064]),
86
+ 'yaxis': 'y'},
87
+ {'alignmentgroup': 'True',
88
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
89
+ 'legendgroup': 'gpt-3.5-turbo',
90
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
+ 'name': 'gpt-3.5-turbo',
92
+ 'offsetgroup': 'gpt-3.5-turbo',
93
+ 'orientation': 'v',
94
+ 'showlegend': True,
95
+ 'textposition': 'auto',
96
+ 'type': 'bar',
97
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
98
+ 'xaxis': 'x',
99
+ 'y': array([5.28237349]),
100
+ 'yaxis': 'y'},
101
+ {'alignmentgroup': 'True',
102
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
103
+ 'legendgroup': 'gpt-4',
104
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
105
+ 'name': 'gpt-4',
106
+ 'offsetgroup': 'gpt-4',
107
+ 'orientation': 'v',
108
+ 'showlegend': True,
109
+ 'textposition': 'auto',
110
+ 'type': 'bar',
111
+ 'x': array(['gpt-4'], dtype=object),
112
+ 'xaxis': 'x',
113
+ 'y': array([15.52184566]),
114
+ 'yaxis': 'y'},
115
+ {'alignmentgroup': 'True',
116
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
117
+ 'legendgroup': 'gpt-4-turbo',
118
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
119
+ 'name': 'gpt-4-turbo',
120
+ 'offsetgroup': 'gpt-4-turbo',
121
+ 'orientation': 'v',
122
+ 'showlegend': True,
123
+ 'textposition': 'auto',
124
+ 'type': 'bar',
125
+ 'x': array(['gpt-4-turbo'], dtype=object),
126
+ 'xaxis': 'x',
127
+ 'y': array([14.00852903]),
128
+ 'yaxis': 'y'},
129
+ {'alignmentgroup': 'True',
130
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
131
+ 'legendgroup': 'llama-2-70b-chat',
132
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
133
+ 'name': 'llama-2-70b-chat',
134
+ 'offsetgroup': 'llama-2-70b-chat',
135
+ 'orientation': 'v',
136
+ 'showlegend': True,
137
+ 'textposition': 'auto',
138
+ 'type': 'bar',
139
+ 'x': array(['llama-2-70b-chat'], dtype=object),
140
+ 'xaxis': 'x',
141
+ 'y': array([6.0658799]),
142
+ 'yaxis': 'y'},
143
+ {'alignmentgroup': 'True',
144
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
145
+ 'legendgroup': 'zephyr-7b-beta',
146
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
147
+ 'name': 'zephyr-7b-beta',
148
+ 'offsetgroup': 'zephyr-7b-beta',
149
+ 'orientation': 'v',
150
+ 'showlegend': True,
151
+ 'textposition': 'auto',
152
+ 'type': 'bar',
153
+ 'x': array(['zephyr-7b-beta'], dtype=object),
154
+ 'xaxis': 'x',
155
+ 'y': array([3.23879932]),
156
+ 'yaxis': 'y'}],
157
+ 'layout': {'barmode': 'relative',
158
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
159
+ 'template': '...',
160
+ 'title': {'text': 'Model endpoints response times'},
161
+ 'xaxis': {'anchor': 'y',
162
+ 'categoryarray': [Mistral-7B-Instruct-v0.2,
163
+ Mixtral-8x7B-Instruct-v0.1,
164
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
165
+ chat-bison, chat-bison-32k, gemini-pro,
166
+ gpt-3.5-turbo, gpt-4, gpt-4-turbo,
167
+ llama-2-70b-chat, zephyr-7b-beta],
168
+ 'categoryorder': 'array',
169
+ 'domain': [0.0, 1.0],
170
+ 'title': {'text': 'Model'}},
171
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution time (s)'}}}
172
+ })",Model endpoints response times,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[3.174540030956268],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[7.142197625471814],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.2902645373344421],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[3.890243631601334],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[4.128177767992019],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[4.72138064004937],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[5.282373493889353],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[15.5218456586202],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[14.008529031276703],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[6.06587989590749],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[3.2387993240356447],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3
786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidi
ty"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ti
cks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line""
:{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison"",""chat-bison-32k"",""gemini-pro"",""gpt-3.5-turbo"",""gpt-4"",""gpt-4-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution time (s)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model endpoints response times""},""barmode"":""relative""}}"
173
+ ./html/plots/execution_costs.html,"Figure({
174
+ 'data': [{'alignmentgroup': 'True',
175
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
176
+ 'legendgroup': 'gpt-3.5-turbo',
177
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
178
+ 'name': 'gpt-3.5-turbo',
179
+ 'offsetgroup': 'gpt-3.5-turbo',
180
+ 'orientation': 'v',
181
+ 'showlegend': True,
182
+ 'textposition': 'auto',
183
+ 'type': 'bar',
184
+ 'x': array(['gpt-3.5-turbo', 'gpt-3.5-turbo'], dtype=object),
185
+ 'xaxis': 'x',
186
+ 'y': array([0.020813, 0.020813]),
187
+ 'yaxis': 'y'},
188
+ {'alignmentgroup': 'True',
189
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
190
+ 'legendgroup': 'gpt-4-turbo',
191
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
192
+ 'name': 'gpt-4-turbo',
193
+ 'offsetgroup': 'gpt-4-turbo',
194
+ 'orientation': 'v',
195
+ 'showlegend': True,
196
+ 'textposition': 'auto',
197
+ 'type': 'bar',
198
+ 'x': array(['gpt-4-turbo'], dtype=object),
199
+ 'xaxis': 'x',
200
+ 'y': array([0.21397]),
201
+ 'yaxis': 'y'},
202
+ {'alignmentgroup': 'True',
203
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
204
+ 'legendgroup': 'gpt-4',
205
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
206
+ 'name': 'gpt-4',
207
+ 'offsetgroup': 'gpt-4',
208
+ 'orientation': 'v',
209
+ 'showlegend': True,
210
+ 'textposition': 'auto',
211
+ 'type': 'bar',
212
+ 'x': array(['gpt-4'], dtype=object),
213
+ 'xaxis': 'x',
214
+ 'y': array([0.58395]),
215
+ 'yaxis': 'y'},
216
+ {'alignmentgroup': 'True',
217
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
218
+ 'legendgroup': 'llama-2-70b-chat',
219
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
220
+ 'name': 'llama-2-70b-chat',
221
+ 'offsetgroup': 'llama-2-70b-chat',
222
+ 'orientation': 'v',
223
+ 'showlegend': True,
224
+ 'textposition': 'auto',
225
+ 'type': 'bar',
226
+ 'x': array(['llama-2-70b-chat'], dtype=object),
227
+ 'xaxis': 'x',
228
+ 'y': array([0.0044992]),
229
+ 'yaxis': 'y'},
230
+ {'alignmentgroup': 'True',
231
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
232
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
233
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
234
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
235
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
236
+ 'orientation': 'v',
237
+ 'showlegend': True,
238
+ 'textposition': 'auto',
239
+ 'type': 'bar',
240
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
241
+ 'xaxis': 'x',
242
+ 'y': array([0.016236]),
243
+ 'yaxis': 'y'},
244
+ {'alignmentgroup': 'True',
245
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
246
+ 'legendgroup': 'zephyr-7b-beta',
247
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
248
+ 'name': 'zephyr-7b-beta',
249
+ 'offsetgroup': 'zephyr-7b-beta',
250
+ 'orientation': 'v',
251
+ 'showlegend': True,
252
+ 'textposition': 'auto',
253
+ 'type': 'bar',
254
+ 'x': array(['zephyr-7b-beta'], dtype=object),
255
+ 'xaxis': 'x',
256
+ 'y': array([0.09306563]),
257
+ 'yaxis': 'y'},
258
+ {'alignmentgroup': 'True',
259
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
260
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
261
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
262
+ 'name': 'Mistral-7B-Instruct-v0.2',
263
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
264
+ 'orientation': 'v',
265
+ 'showlegend': True,
266
+ 'textposition': 'auto',
267
+ 'type': 'bar',
268
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
269
+ 'xaxis': 'x',
270
+ 'y': array([0.08959219]),
271
+ 'yaxis': 'y'},
272
+ {'alignmentgroup': 'True',
273
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
274
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
275
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
276
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
277
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
278
+ 'orientation': 'v',
279
+ 'showlegend': True,
280
+ 'textposition': 'auto',
281
+ 'type': 'bar',
282
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
283
+ 'xaxis': 'x',
284
+ 'y': array([0.04085264]),
285
+ 'yaxis': 'y'},
286
+ {'alignmentgroup': 'True',
287
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
288
+ 'legendgroup': 'gemini-pro',
289
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
290
+ 'name': 'gemini-pro',
291
+ 'offsetgroup': 'gemini-pro',
292
+ 'orientation': 'v',
293
+ 'showlegend': True,
294
+ 'textposition': 'auto',
295
+ 'type': 'bar',
296
+ 'x': array(['gemini-pro'], dtype=object),
297
+ 'xaxis': 'x',
298
+ 'y': array([0.00511825]),
299
+ 'yaxis': 'y'},
300
+ {'alignmentgroup': 'True',
301
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
302
+ 'legendgroup': 'chat-bison (PaLM 2)',
303
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
304
+ 'name': 'chat-bison (PaLM 2)',
305
+ 'offsetgroup': 'chat-bison (PaLM 2)',
306
+ 'orientation': 'v',
307
+ 'showlegend': True,
308
+ 'textposition': 'auto',
309
+ 'type': 'bar',
310
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
311
+ 'xaxis': 'x',
312
+ 'y': array([0.]),
313
+ 'yaxis': 'y'},
314
+ {'alignmentgroup': 'True',
315
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
316
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
317
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
318
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
319
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
320
+ 'orientation': 'v',
321
+ 'showlegend': True,
322
+ 'textposition': 'auto',
323
+ 'type': 'bar',
324
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
325
+ 'xaxis': 'x',
326
+ 'y': array([0.]),
327
+ 'yaxis': 'y'}],
328
+ 'layout': {'barmode': 'relative',
329
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
330
+ 'template': '...',
331
+ 'title': {'text': 'Costs of execution of 39 test queries per model'},
332
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
333
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}}}
334
+ })",Costs of execution of 39 test queries per model,Note that some providers bill by token count and some by execution time. In the second case we used averaged pausing and resuming time to calculate the cost and assumed that all queries have been done in one session. Also note that for now the Gemini-Pro model is free for under 60 queries per minute.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo"",""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[0.020813,0.020813],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[0.21397],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[0.58395],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[0.0044992],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[0.016236],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[0.09306563151081403],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[0.08959219022260773],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[0.04085263746182124],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[0.00511825],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 
32K)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlin
ewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapb
ox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2
222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},
""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 39 test queries per model""},""barmode"":""relative""}}"
335
+ ./html/plots/model_sizes.html,"Figure({
336
+ 'data': [{'alignmentgroup': 'True',
337
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
338
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
339
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
340
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
341
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
342
+ 'orientation': 'v',
343
+ 'showlegend': True,
344
+ 'textposition': 'auto',
345
+ 'type': 'bar',
346
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
347
+ 'xaxis': 'x',
348
+ 'y': array([56.]),
349
+ 'yaxis': 'y'},
350
+ {'alignmentgroup': 'True',
351
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
352
+ 'legendgroup': 'zephyr-7b-beta',
353
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
354
+ 'name': 'zephyr-7b-beta',
355
+ 'offsetgroup': 'zephyr-7b-beta',
356
+ 'orientation': 'v',
357
+ 'showlegend': True,
358
+ 'textposition': 'auto',
359
+ 'type': 'bar',
360
+ 'x': array(['zephyr-7b-beta'], dtype=object),
361
+ 'xaxis': 'x',
362
+ 'y': array([7.]),
363
+ 'yaxis': 'y'},
364
+ {'alignmentgroup': 'True',
365
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
366
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
367
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
368
+ 'name': 'Mistral-7B-Instruct-v0.2',
369
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
370
+ 'orientation': 'v',
371
+ 'showlegend': True,
372
+ 'textposition': 'auto',
373
+ 'type': 'bar',
374
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
375
+ 'xaxis': 'x',
376
+ 'y': array([7.]),
377
+ 'yaxis': 'y'},
378
+ {'alignmentgroup': 'True',
379
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
380
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
381
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
382
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
383
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
384
+ 'orientation': 'v',
385
+ 'showlegend': True,
386
+ 'textposition': 'auto',
387
+ 'type': 'bar',
388
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
389
+ 'xaxis': 'x',
390
+ 'y': array([1.1]),
391
+ 'yaxis': 'y'}],
392
+ 'layout': {'barmode': 'relative',
393
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
394
+ 'template': '...',
395
+ 'title': {'text': 'Model sizes in billions of parameters'},
396
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
397
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}}}
398
+ })",Model sizes in billions of parameters,Note that some models have undisclosed sizes.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B 
params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.1],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.
2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}
}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary""
:{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true
,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"
data/2024-01-26 11:20:49.179382_general_plot.csv ADDED
@@ -0,0 +1,398 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ path,plot_object,description,comment,plot_json
2
+ ./html/plots/response_times.html,"Figure({
3
+ 'data': [{'alignmentgroup': 'True',
4
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
5
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
6
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
7
+ 'name': 'Mistral-7B-Instruct-v0.2',
8
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
9
+ 'orientation': 'v',
10
+ 'showlegend': True,
11
+ 'textposition': 'auto',
12
+ 'type': 'bar',
13
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
+ 'xaxis': 'x',
15
+ 'y': array([3.17454003]),
16
+ 'yaxis': 'y'},
17
+ {'alignmentgroup': 'True',
18
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
19
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
20
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
21
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
22
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
23
+ 'orientation': 'v',
24
+ 'showlegend': True,
25
+ 'textposition': 'auto',
26
+ 'type': 'bar',
27
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
+ 'xaxis': 'x',
29
+ 'y': array([7.14219763]),
30
+ 'yaxis': 'y'},
31
+ {'alignmentgroup': 'True',
32
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
33
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
34
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
35
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
36
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
37
+ 'orientation': 'v',
38
+ 'showlegend': True,
39
+ 'textposition': 'auto',
40
+ 'type': 'bar',
41
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
+ 'xaxis': 'x',
43
+ 'y': array([1.29026454]),
44
+ 'yaxis': 'y'},
45
+ {'alignmentgroup': 'True',
46
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
47
+ 'legendgroup': 'chat-bison',
48
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
+ 'name': 'chat-bison',
50
+ 'offsetgroup': 'chat-bison',
51
+ 'orientation': 'v',
52
+ 'showlegend': True,
53
+ 'textposition': 'auto',
54
+ 'type': 'bar',
55
+ 'x': array(['chat-bison'], dtype=object),
56
+ 'xaxis': 'x',
57
+ 'y': array([3.89024363]),
58
+ 'yaxis': 'y'},
59
+ {'alignmentgroup': 'True',
60
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
61
+ 'legendgroup': 'chat-bison-32k',
62
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
+ 'name': 'chat-bison-32k',
64
+ 'offsetgroup': 'chat-bison-32k',
65
+ 'orientation': 'v',
66
+ 'showlegend': True,
67
+ 'textposition': 'auto',
68
+ 'type': 'bar',
69
+ 'x': array(['chat-bison-32k'], dtype=object),
70
+ 'xaxis': 'x',
71
+ 'y': array([4.12817777]),
72
+ 'yaxis': 'y'},
73
+ {'alignmentgroup': 'True',
74
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
75
+ 'legendgroup': 'gemini-pro',
76
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
+ 'name': 'gemini-pro',
78
+ 'offsetgroup': 'gemini-pro',
79
+ 'orientation': 'v',
80
+ 'showlegend': True,
81
+ 'textposition': 'auto',
82
+ 'type': 'bar',
83
+ 'x': array(['gemini-pro'], dtype=object),
84
+ 'xaxis': 'x',
85
+ 'y': array([4.72138064]),
86
+ 'yaxis': 'y'},
87
+ {'alignmentgroup': 'True',
88
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
89
+ 'legendgroup': 'gpt-3.5-turbo',
90
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
+ 'name': 'gpt-3.5-turbo',
92
+ 'offsetgroup': 'gpt-3.5-turbo',
93
+ 'orientation': 'v',
94
+ 'showlegend': True,
95
+ 'textposition': 'auto',
96
+ 'type': 'bar',
97
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
98
+ 'xaxis': 'x',
99
+ 'y': array([5.28237349]),
100
+ 'yaxis': 'y'},
101
+ {'alignmentgroup': 'True',
102
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
103
+ 'legendgroup': 'gpt-4',
104
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
105
+ 'name': 'gpt-4',
106
+ 'offsetgroup': 'gpt-4',
107
+ 'orientation': 'v',
108
+ 'showlegend': True,
109
+ 'textposition': 'auto',
110
+ 'type': 'bar',
111
+ 'x': array(['gpt-4'], dtype=object),
112
+ 'xaxis': 'x',
113
+ 'y': array([15.52184566]),
114
+ 'yaxis': 'y'},
115
+ {'alignmentgroup': 'True',
116
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
117
+ 'legendgroup': 'gpt-4-turbo',
118
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
119
+ 'name': 'gpt-4-turbo',
120
+ 'offsetgroup': 'gpt-4-turbo',
121
+ 'orientation': 'v',
122
+ 'showlegend': True,
123
+ 'textposition': 'auto',
124
+ 'type': 'bar',
125
+ 'x': array(['gpt-4-turbo'], dtype=object),
126
+ 'xaxis': 'x',
127
+ 'y': array([14.00852903]),
128
+ 'yaxis': 'y'},
129
+ {'alignmentgroup': 'True',
130
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
131
+ 'legendgroup': 'llama-2-70b-chat',
132
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
133
+ 'name': 'llama-2-70b-chat',
134
+ 'offsetgroup': 'llama-2-70b-chat',
135
+ 'orientation': 'v',
136
+ 'showlegend': True,
137
+ 'textposition': 'auto',
138
+ 'type': 'bar',
139
+ 'x': array(['llama-2-70b-chat'], dtype=object),
140
+ 'xaxis': 'x',
141
+ 'y': array([6.0658799]),
142
+ 'yaxis': 'y'},
143
+ {'alignmentgroup': 'True',
144
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
145
+ 'legendgroup': 'zephyr-7b-beta',
146
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
147
+ 'name': 'zephyr-7b-beta',
148
+ 'offsetgroup': 'zephyr-7b-beta',
149
+ 'orientation': 'v',
150
+ 'showlegend': True,
151
+ 'textposition': 'auto',
152
+ 'type': 'bar',
153
+ 'x': array(['zephyr-7b-beta'], dtype=object),
154
+ 'xaxis': 'x',
155
+ 'y': array([3.23879932]),
156
+ 'yaxis': 'y'}],
157
+ 'layout': {'barmode': 'relative',
158
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
159
+ 'template': '...',
160
+ 'title': {'text': 'Model endpoints response times'},
161
+ 'xaxis': {'anchor': 'y',
162
+ 'categoryarray': [Mistral-7B-Instruct-v0.2,
163
+ Mixtral-8x7B-Instruct-v0.1,
164
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
165
+ chat-bison, chat-bison-32k, gemini-pro,
166
+ gpt-3.5-turbo, gpt-4, gpt-4-turbo,
167
+ llama-2-70b-chat, zephyr-7b-beta],
168
+ 'categoryorder': 'array',
169
+ 'domain': [0.0, 1.0],
170
+ 'title': {'text': 'Model'}},
171
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution time (s)'}}}
172
+ })",Model endpoints response times,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[3.174540030956268],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[7.142197625471814],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.2902645373344421],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[3.890243631601334],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[4.128177767992019],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[4.72138064004937],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[5.282373493889353],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[15.5218456586202],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[14.008529031276703],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[6.06587989590749],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[3.2387993240356447],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3
786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidi
ty"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ti
cks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line""
:{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison"",""chat-bison-32k"",""gemini-pro"",""gpt-3.5-turbo"",""gpt-4"",""gpt-4-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution time (s)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model endpoints response times""},""barmode"":""relative""}}"
173
+ ./html/plots/execution_costs.html,"Figure({
174
+ 'data': [{'alignmentgroup': 'True',
175
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
176
+ 'legendgroup': 'gpt-3.5-turbo',
177
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
178
+ 'name': 'gpt-3.5-turbo',
179
+ 'offsetgroup': 'gpt-3.5-turbo',
180
+ 'orientation': 'v',
181
+ 'showlegend': True,
182
+ 'textposition': 'auto',
183
+ 'type': 'bar',
184
+ 'x': array(['gpt-3.5-turbo', 'gpt-3.5-turbo'], dtype=object),
185
+ 'xaxis': 'x',
186
+ 'y': array([0.032366, 0.032366]),
187
+ 'yaxis': 'y'},
188
+ {'alignmentgroup': 'True',
189
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
190
+ 'legendgroup': 'gpt-4-turbo',
191
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
192
+ 'name': 'gpt-4-turbo',
193
+ 'offsetgroup': 'gpt-4-turbo',
194
+ 'orientation': 'v',
195
+ 'showlegend': True,
196
+ 'textposition': 'auto',
197
+ 'type': 'bar',
198
+ 'x': array(['gpt-4-turbo'], dtype=object),
199
+ 'xaxis': 'x',
200
+ 'y': array([0.21176]),
201
+ 'yaxis': 'y'},
202
+ {'alignmentgroup': 'True',
203
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
204
+ 'legendgroup': 'gpt-4',
205
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
206
+ 'name': 'gpt-4',
207
+ 'offsetgroup': 'gpt-4',
208
+ 'orientation': 'v',
209
+ 'showlegend': True,
210
+ 'textposition': 'auto',
211
+ 'type': 'bar',
212
+ 'x': array(['gpt-4'], dtype=object),
213
+ 'xaxis': 'x',
214
+ 'y': array([0.5778]),
215
+ 'yaxis': 'y'},
216
+ {'alignmentgroup': 'True',
217
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
218
+ 'legendgroup': 'llama-2-70b-chat',
219
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
220
+ 'name': 'llama-2-70b-chat',
221
+ 'offsetgroup': 'llama-2-70b-chat',
222
+ 'orientation': 'v',
223
+ 'showlegend': True,
224
+ 'textposition': 'auto',
225
+ 'type': 'bar',
226
+ 'x': array(['llama-2-70b-chat'], dtype=object),
227
+ 'xaxis': 'x',
228
+ 'y': array([0.0051984]),
229
+ 'yaxis': 'y'},
230
+ {'alignmentgroup': 'True',
231
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
232
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
233
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
234
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
235
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
236
+ 'orientation': 'v',
237
+ 'showlegend': True,
238
+ 'textposition': 'auto',
239
+ 'type': 'bar',
240
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
241
+ 'xaxis': 'x',
242
+ 'y': array([0.0254493]),
243
+ 'yaxis': 'y'},
244
+ {'alignmentgroup': 'True',
245
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
246
+ 'legendgroup': 'zephyr-7b-beta',
247
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
248
+ 'name': 'zephyr-7b-beta',
249
+ 'offsetgroup': 'zephyr-7b-beta',
250
+ 'orientation': 'v',
251
+ 'showlegend': True,
252
+ 'textposition': 'auto',
253
+ 'type': 'bar',
254
+ 'x': array(['zephyr-7b-beta'], dtype=object),
255
+ 'xaxis': 'x',
256
+ 'y': array([0.]),
257
+ 'yaxis': 'y'},
258
+ {'alignmentgroup': 'True',
259
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
260
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
261
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
262
+ 'name': 'Mistral-7B-Instruct-v0.2',
263
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
264
+ 'orientation': 'v',
265
+ 'showlegend': True,
266
+ 'textposition': 'auto',
267
+ 'type': 'bar',
268
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
269
+ 'xaxis': 'x',
270
+ 'y': array([0.]),
271
+ 'yaxis': 'y'},
272
+ {'alignmentgroup': 'True',
273
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
274
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
275
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
276
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
277
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
278
+ 'orientation': 'v',
279
+ 'showlegend': True,
280
+ 'textposition': 'auto',
281
+ 'type': 'bar',
282
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
283
+ 'xaxis': 'x',
284
+ 'y': array([0.]),
285
+ 'yaxis': 'y'},
286
+ {'alignmentgroup': 'True',
287
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
288
+ 'legendgroup': 'gemini-pro',
289
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
290
+ 'name': 'gemini-pro',
291
+ 'offsetgroup': 'gemini-pro',
292
+ 'orientation': 'v',
293
+ 'showlegend': True,
294
+ 'textposition': 'auto',
295
+ 'type': 'bar',
296
+ 'x': array(['gemini-pro'], dtype=object),
297
+ 'xaxis': 'x',
298
+ 'y': array([0.00706925]),
299
+ 'yaxis': 'y'},
300
+ {'alignmentgroup': 'True',
301
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
302
+ 'legendgroup': 'chat-bison (PaLM 2)',
303
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
304
+ 'name': 'chat-bison (PaLM 2)',
305
+ 'offsetgroup': 'chat-bison (PaLM 2)',
306
+ 'orientation': 'v',
307
+ 'showlegend': True,
308
+ 'textposition': 'auto',
309
+ 'type': 'bar',
310
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
311
+ 'xaxis': 'x',
312
+ 'y': array([0.]),
313
+ 'yaxis': 'y'},
314
+ {'alignmentgroup': 'True',
315
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
316
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
317
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
318
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
319
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
320
+ 'orientation': 'v',
321
+ 'showlegend': True,
322
+ 'textposition': 'auto',
323
+ 'type': 'bar',
324
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
325
+ 'xaxis': 'x',
326
+ 'y': array([0.]),
327
+ 'yaxis': 'y'}],
328
+ 'layout': {'barmode': 'relative',
329
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
330
+ 'template': '...',
331
+ 'title': {'text': 'Costs of execution of 39 test queries per model'},
332
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
333
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}}}
334
+ })",Costs of execution of 39 test queries per model,Note that some providers bill by token count and some by execution time. In the second case we used averaged pausing and resuming time to calculate the cost and assumed that all queries have been done in one session. Also note that for now the Gemini-Pro model is free for under 60 queries per minute.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo"",""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[0.032366,0.032366],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[0.21176000000000003],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[0.5778000000000001],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[0.005198400000000001],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[0.0254493],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[0.00706925],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 
32K)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlin
ewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapb
ox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2
222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},
""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 39 test queries per model""},""barmode"":""relative""}}"
335
+ ./html/plots/model_sizes.html,"Figure({
336
+ 'data': [{'alignmentgroup': 'True',
337
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
338
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
339
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
340
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
341
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
342
+ 'orientation': 'v',
343
+ 'showlegend': True,
344
+ 'textposition': 'auto',
345
+ 'type': 'bar',
346
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
347
+ 'xaxis': 'x',
348
+ 'y': array([56.]),
349
+ 'yaxis': 'y'},
350
+ {'alignmentgroup': 'True',
351
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
352
+ 'legendgroup': 'zephyr-7b-beta',
353
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
354
+ 'name': 'zephyr-7b-beta',
355
+ 'offsetgroup': 'zephyr-7b-beta',
356
+ 'orientation': 'v',
357
+ 'showlegend': True,
358
+ 'textposition': 'auto',
359
+ 'type': 'bar',
360
+ 'x': array(['zephyr-7b-beta'], dtype=object),
361
+ 'xaxis': 'x',
362
+ 'y': array([7.]),
363
+ 'yaxis': 'y'},
364
+ {'alignmentgroup': 'True',
365
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
366
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
367
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
368
+ 'name': 'Mistral-7B-Instruct-v0.2',
369
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
370
+ 'orientation': 'v',
371
+ 'showlegend': True,
372
+ 'textposition': 'auto',
373
+ 'type': 'bar',
374
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
375
+ 'xaxis': 'x',
376
+ 'y': array([7.]),
377
+ 'yaxis': 'y'},
378
+ {'alignmentgroup': 'True',
379
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
380
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
381
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
382
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
383
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
384
+ 'orientation': 'v',
385
+ 'showlegend': True,
386
+ 'textposition': 'auto',
387
+ 'type': 'bar',
388
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
389
+ 'xaxis': 'x',
390
+ 'y': array([1.1]),
391
+ 'yaxis': 'y'}],
392
+ 'layout': {'barmode': 'relative',
393
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
394
+ 'template': '...',
395
+ 'title': {'text': 'Model sizes in billions of parameters'},
396
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
397
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}}}
398
+ })",Model sizes in billions of parameters,Note that some models have undisclosed sizes.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B 
params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.1],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.
2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}
}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary""
:{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true
,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"
data/2024-01-26 11:22:32.771167_general_plot.csv ADDED
@@ -0,0 +1,398 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ path,plot_object,description,comment,plot_json
2
+ ./html/plots/response_times.html,"Figure({
3
+ 'data': [{'alignmentgroup': 'True',
4
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
5
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
6
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
7
+ 'name': 'Mistral-7B-Instruct-v0.2',
8
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
9
+ 'orientation': 'v',
10
+ 'showlegend': True,
11
+ 'textposition': 'auto',
12
+ 'type': 'bar',
13
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
+ 'xaxis': 'x',
15
+ 'y': array([3.17454003]),
16
+ 'yaxis': 'y'},
17
+ {'alignmentgroup': 'True',
18
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
19
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
20
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
21
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
22
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
23
+ 'orientation': 'v',
24
+ 'showlegend': True,
25
+ 'textposition': 'auto',
26
+ 'type': 'bar',
27
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
+ 'xaxis': 'x',
29
+ 'y': array([7.14219763]),
30
+ 'yaxis': 'y'},
31
+ {'alignmentgroup': 'True',
32
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
33
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
34
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
35
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
36
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
37
+ 'orientation': 'v',
38
+ 'showlegend': True,
39
+ 'textposition': 'auto',
40
+ 'type': 'bar',
41
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
+ 'xaxis': 'x',
43
+ 'y': array([1.29026454]),
44
+ 'yaxis': 'y'},
45
+ {'alignmentgroup': 'True',
46
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
47
+ 'legendgroup': 'chat-bison',
48
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
+ 'name': 'chat-bison',
50
+ 'offsetgroup': 'chat-bison',
51
+ 'orientation': 'v',
52
+ 'showlegend': True,
53
+ 'textposition': 'auto',
54
+ 'type': 'bar',
55
+ 'x': array(['chat-bison'], dtype=object),
56
+ 'xaxis': 'x',
57
+ 'y': array([3.89024363]),
58
+ 'yaxis': 'y'},
59
+ {'alignmentgroup': 'True',
60
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
61
+ 'legendgroup': 'chat-bison-32k',
62
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
+ 'name': 'chat-bison-32k',
64
+ 'offsetgroup': 'chat-bison-32k',
65
+ 'orientation': 'v',
66
+ 'showlegend': True,
67
+ 'textposition': 'auto',
68
+ 'type': 'bar',
69
+ 'x': array(['chat-bison-32k'], dtype=object),
70
+ 'xaxis': 'x',
71
+ 'y': array([4.12817777]),
72
+ 'yaxis': 'y'},
73
+ {'alignmentgroup': 'True',
74
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
75
+ 'legendgroup': 'gemini-pro',
76
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
+ 'name': 'gemini-pro',
78
+ 'offsetgroup': 'gemini-pro',
79
+ 'orientation': 'v',
80
+ 'showlegend': True,
81
+ 'textposition': 'auto',
82
+ 'type': 'bar',
83
+ 'x': array(['gemini-pro'], dtype=object),
84
+ 'xaxis': 'x',
85
+ 'y': array([4.72138064]),
86
+ 'yaxis': 'y'},
87
+ {'alignmentgroup': 'True',
88
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
89
+ 'legendgroup': 'gpt-3.5-turbo',
90
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
+ 'name': 'gpt-3.5-turbo',
92
+ 'offsetgroup': 'gpt-3.5-turbo',
93
+ 'orientation': 'v',
94
+ 'showlegend': True,
95
+ 'textposition': 'auto',
96
+ 'type': 'bar',
97
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
98
+ 'xaxis': 'x',
99
+ 'y': array([5.28237349]),
100
+ 'yaxis': 'y'},
101
+ {'alignmentgroup': 'True',
102
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
103
+ 'legendgroup': 'gpt-4',
104
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
105
+ 'name': 'gpt-4',
106
+ 'offsetgroup': 'gpt-4',
107
+ 'orientation': 'v',
108
+ 'showlegend': True,
109
+ 'textposition': 'auto',
110
+ 'type': 'bar',
111
+ 'x': array(['gpt-4'], dtype=object),
112
+ 'xaxis': 'x',
113
+ 'y': array([15.52184566]),
114
+ 'yaxis': 'y'},
115
+ {'alignmentgroup': 'True',
116
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
117
+ 'legendgroup': 'gpt-4-turbo',
118
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
119
+ 'name': 'gpt-4-turbo',
120
+ 'offsetgroup': 'gpt-4-turbo',
121
+ 'orientation': 'v',
122
+ 'showlegend': True,
123
+ 'textposition': 'auto',
124
+ 'type': 'bar',
125
+ 'x': array(['gpt-4-turbo'], dtype=object),
126
+ 'xaxis': 'x',
127
+ 'y': array([14.00852903]),
128
+ 'yaxis': 'y'},
129
+ {'alignmentgroup': 'True',
130
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
131
+ 'legendgroup': 'llama-2-70b-chat',
132
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
133
+ 'name': 'llama-2-70b-chat',
134
+ 'offsetgroup': 'llama-2-70b-chat',
135
+ 'orientation': 'v',
136
+ 'showlegend': True,
137
+ 'textposition': 'auto',
138
+ 'type': 'bar',
139
+ 'x': array(['llama-2-70b-chat'], dtype=object),
140
+ 'xaxis': 'x',
141
+ 'y': array([6.0658799]),
142
+ 'yaxis': 'y'},
143
+ {'alignmentgroup': 'True',
144
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
145
+ 'legendgroup': 'zephyr-7b-beta',
146
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
147
+ 'name': 'zephyr-7b-beta',
148
+ 'offsetgroup': 'zephyr-7b-beta',
149
+ 'orientation': 'v',
150
+ 'showlegend': True,
151
+ 'textposition': 'auto',
152
+ 'type': 'bar',
153
+ 'x': array(['zephyr-7b-beta'], dtype=object),
154
+ 'xaxis': 'x',
155
+ 'y': array([3.23879932]),
156
+ 'yaxis': 'y'}],
157
+ 'layout': {'barmode': 'relative',
158
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
159
+ 'template': '...',
160
+ 'title': {'text': 'Model endpoints response times'},
161
+ 'xaxis': {'anchor': 'y',
162
+ 'categoryarray': [Mistral-7B-Instruct-v0.2,
163
+ Mixtral-8x7B-Instruct-v0.1,
164
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
165
+ chat-bison, chat-bison-32k, gemini-pro,
166
+ gpt-3.5-turbo, gpt-4, gpt-4-turbo,
167
+ llama-2-70b-chat, zephyr-7b-beta],
168
+ 'categoryorder': 'array',
169
+ 'domain': [0.0, 1.0],
170
+ 'title': {'text': 'Model'}},
171
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution time (s)'}}}
172
+ })",Model endpoints response times,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[3.174540030956268],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[7.142197625471814],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.2902645373344421],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[3.890243631601334],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[4.128177767992019],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[4.72138064004937],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[5.282373493889353],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[15.5218456586202],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[14.008529031276703],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[6.06587989590749],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[3.2387993240356447],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3
786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidi
ty"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ti
cks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line""
:{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison"",""chat-bison-32k"",""gemini-pro"",""gpt-3.5-turbo"",""gpt-4"",""gpt-4-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution time (s)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model endpoints response times""},""barmode"":""relative""}}"
173
+ ./html/plots/execution_costs.html,"Figure({
174
+ 'data': [{'alignmentgroup': 'True',
175
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
176
+ 'legendgroup': 'gpt-3.5-turbo',
177
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
178
+ 'name': 'gpt-3.5-turbo',
179
+ 'offsetgroup': 'gpt-3.5-turbo',
180
+ 'orientation': 'v',
181
+ 'showlegend': True,
182
+ 'textposition': 'auto',
183
+ 'type': 'bar',
184
+ 'x': array(['gpt-3.5-turbo', 'gpt-3.5-turbo'], dtype=object),
185
+ 'xaxis': 'x',
186
+ 'y': array([0.020994, 0.020994]),
187
+ 'yaxis': 'y'},
188
+ {'alignmentgroup': 'True',
189
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
190
+ 'legendgroup': 'gpt-4-turbo',
191
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
192
+ 'name': 'gpt-4-turbo',
193
+ 'offsetgroup': 'gpt-4-turbo',
194
+ 'orientation': 'v',
195
+ 'showlegend': True,
196
+ 'textposition': 'auto',
197
+ 'type': 'bar',
198
+ 'x': array(['gpt-4-turbo'], dtype=object),
199
+ 'xaxis': 'x',
200
+ 'y': array([0.02967]),
201
+ 'yaxis': 'y'},
202
+ {'alignmentgroup': 'True',
203
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
204
+ 'legendgroup': 'gpt-4',
205
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
206
+ 'name': 'gpt-4',
207
+ 'offsetgroup': 'gpt-4',
208
+ 'orientation': 'v',
209
+ 'showlegend': True,
210
+ 'textposition': 'auto',
211
+ 'type': 'bar',
212
+ 'x': array(['gpt-4'], dtype=object),
213
+ 'xaxis': 'x',
214
+ 'y': array([0.07839]),
215
+ 'yaxis': 'y'},
216
+ {'alignmentgroup': 'True',
217
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
218
+ 'legendgroup': 'llama-2-70b-chat',
219
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
220
+ 'name': 'llama-2-70b-chat',
221
+ 'offsetgroup': 'llama-2-70b-chat',
222
+ 'orientation': 'v',
223
+ 'showlegend': True,
224
+ 'textposition': 'auto',
225
+ 'type': 'bar',
226
+ 'x': array(['llama-2-70b-chat'], dtype=object),
227
+ 'xaxis': 'x',
228
+ 'y': array([0.0039636]),
229
+ 'yaxis': 'y'},
230
+ {'alignmentgroup': 'True',
231
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
232
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
233
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
234
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
235
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
236
+ 'orientation': 'v',
237
+ 'showlegend': True,
238
+ 'textposition': 'auto',
239
+ 'type': 'bar',
240
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
241
+ 'xaxis': 'x',
242
+ 'y': array([0.0161523]),
243
+ 'yaxis': 'y'},
244
+ {'alignmentgroup': 'True',
245
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
246
+ 'legendgroup': 'zephyr-7b-beta',
247
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
248
+ 'name': 'zephyr-7b-beta',
249
+ 'offsetgroup': 'zephyr-7b-beta',
250
+ 'orientation': 'v',
251
+ 'showlegend': True,
252
+ 'textposition': 'auto',
253
+ 'type': 'bar',
254
+ 'x': array(['zephyr-7b-beta'], dtype=object),
255
+ 'xaxis': 'x',
256
+ 'y': array([0.00550208]),
257
+ 'yaxis': 'y'},
258
+ {'alignmentgroup': 'True',
259
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
260
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
261
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
262
+ 'name': 'Mistral-7B-Instruct-v0.2',
263
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
264
+ 'orientation': 'v',
265
+ 'showlegend': True,
266
+ 'textposition': 'auto',
267
+ 'type': 'bar',
268
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
269
+ 'xaxis': 'x',
270
+ 'y': array([0.00202543]),
271
+ 'yaxis': 'y'},
272
+ {'alignmentgroup': 'True',
273
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
274
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
275
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
276
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
277
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
278
+ 'orientation': 'v',
279
+ 'showlegend': True,
280
+ 'textposition': 'auto',
281
+ 'type': 'bar',
282
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
283
+ 'xaxis': 'x',
284
+ 'y': array([0.00046687]),
285
+ 'yaxis': 'y'},
286
+ {'alignmentgroup': 'True',
287
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
288
+ 'legendgroup': 'gemini-pro',
289
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
290
+ 'name': 'gemini-pro',
291
+ 'offsetgroup': 'gemini-pro',
292
+ 'orientation': 'v',
293
+ 'showlegend': True,
294
+ 'textposition': 'auto',
295
+ 'type': 'bar',
296
+ 'x': array(['gemini-pro'], dtype=object),
297
+ 'xaxis': 'x',
298
+ 'y': array([0.005052]),
299
+ 'yaxis': 'y'},
300
+ {'alignmentgroup': 'True',
301
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
302
+ 'legendgroup': 'chat-bison (PaLM 2)',
303
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
304
+ 'name': 'chat-bison (PaLM 2)',
305
+ 'offsetgroup': 'chat-bison (PaLM 2)',
306
+ 'orientation': 'v',
307
+ 'showlegend': True,
308
+ 'textposition': 'auto',
309
+ 'type': 'bar',
310
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
311
+ 'xaxis': 'x',
312
+ 'y': array([0.]),
313
+ 'yaxis': 'y'},
314
+ {'alignmentgroup': 'True',
315
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
316
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
317
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
318
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
319
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
320
+ 'orientation': 'v',
321
+ 'showlegend': True,
322
+ 'textposition': 'auto',
323
+ 'type': 'bar',
324
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
325
+ 'xaxis': 'x',
326
+ 'y': array([0.]),
327
+ 'yaxis': 'y'}],
328
+ 'layout': {'barmode': 'relative',
329
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
330
+ 'template': '...',
331
+ 'title': {'text': 'Costs of execution of 39 test queries per model'},
332
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
333
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}}}
334
+ })",Costs of execution of 39 test queries per model,Note that some providers bill by token count and some by execution time. In the second case we used averaged pausing and resuming time to calculate the cost and assumed that all queries have been done in one session. Also note that for now the Gemini-Pro model is free for under 60 queries per minute.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo"",""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[0.020994000000000002,0.020994000000000002],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[0.029670000000000002],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[0.07839],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[0.0039636],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[0.016152299999999998],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[0.005502075092660056],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[0.002025430454148187],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[0.0004668651938438415],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[0.005052],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 
32K)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlin
ewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapb
ox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2
222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},
""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 39 test queries per model""},""barmode"":""relative""}}"
335
+ ./html/plots/model_sizes.html,"Figure({
336
+ 'data': [{'alignmentgroup': 'True',
337
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
338
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
339
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
340
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
341
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
342
+ 'orientation': 'v',
343
+ 'showlegend': True,
344
+ 'textposition': 'auto',
345
+ 'type': 'bar',
346
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
347
+ 'xaxis': 'x',
348
+ 'y': array([56.]),
349
+ 'yaxis': 'y'},
350
+ {'alignmentgroup': 'True',
351
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
352
+ 'legendgroup': 'zephyr-7b-beta',
353
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
354
+ 'name': 'zephyr-7b-beta',
355
+ 'offsetgroup': 'zephyr-7b-beta',
356
+ 'orientation': 'v',
357
+ 'showlegend': True,
358
+ 'textposition': 'auto',
359
+ 'type': 'bar',
360
+ 'x': array(['zephyr-7b-beta'], dtype=object),
361
+ 'xaxis': 'x',
362
+ 'y': array([7.]),
363
+ 'yaxis': 'y'},
364
+ {'alignmentgroup': 'True',
365
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
366
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
367
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
368
+ 'name': 'Mistral-7B-Instruct-v0.2',
369
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
370
+ 'orientation': 'v',
371
+ 'showlegend': True,
372
+ 'textposition': 'auto',
373
+ 'type': 'bar',
374
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
375
+ 'xaxis': 'x',
376
+ 'y': array([7.]),
377
+ 'yaxis': 'y'},
378
+ {'alignmentgroup': 'True',
379
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
380
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
381
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
382
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
383
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
384
+ 'orientation': 'v',
385
+ 'showlegend': True,
386
+ 'textposition': 'auto',
387
+ 'type': 'bar',
388
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
389
+ 'xaxis': 'x',
390
+ 'y': array([1.1]),
391
+ 'yaxis': 'y'}],
392
+ 'layout': {'barmode': 'relative',
393
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
394
+ 'template': '...',
395
+ 'title': {'text': 'Model sizes in billions of parameters'},
396
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
397
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}}}
398
+ })",Model sizes in billions of parameters,Note that some models have undisclosed sizes.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B 
params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.1],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.
2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}
}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary""
:{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true
,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"
data/2024-01-26 16:13:38.191636_model_costs.csv ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,provider,provider_pricing,cost_per_token
2
+ gpt-3.5-turbo,OpenAI,"$1 / 1M input tokens, $2 / 1M output tokens","$1 / 1M input tokens, $2 / 1M output tokens"
3
+ gpt-4-turbo,OpenAI,"$10 / 1M input tokens, $30 / 1M output tokens","$10 / 1M input tokens, $30 / 1M output tokens"
4
+ gpt-4,OpenAI,"$30 / 1M input tokens, $60 / 1M output tokens","$30 / 1M input tokens, $60 / 1M output tokens"
5
+ gpt-3.5-turbo,OpenAI,"$1 / 1M input tokens, $2 / 1M output tokens","$1 / 1M input tokens, $2 / 1M output tokens"
6
+ llama-2-70b-chat,Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
7
+ Mixtral-8x7B-Instruct-v0.1,Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
8
+ zephyr-7b-beta,Hugging Face Inference Endpoint,$1.3 / hour,$5.364983589763427e-11 / 1M tokens
9
+ Mistral-7B-Instruct-v0.2,Hugging Face Inference Endpoint,$1.3 / hour,$5.2585398066299045e-11 / 1M tokens
10
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,Hugging Face Inference Endpoint,$0.6 / hour,$1.0752204477787017e-11 / 1M tokens
11
+ gemini-pro,Google VertexAI,"$0.25 / 1M input characters, $0.5 / 1M output characters (60 queries per minute are free)","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
12
+ chat-bison (PaLM 2),Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
13
+ chat-bison-32k (PaLM 2 32K),Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
data/2024-01-26 16:16:56.390177_model_costs.csv ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,provider,provider_pricing,cost_per_token
2
+ gpt-3.5-turbo,OpenAI,"$1.00 / 1M input tokens, $2.00 / 1M output tokens","$1.00 / 1M input tokens, $2.00 / 1M output tokens"
3
+ gpt-4-turbo,OpenAI,"$10.00 / 1M input tokens, $30.00 / 1M output tokens","$10.00 / 1M input tokens, $30.00 / 1M output tokens"
4
+ gpt-4,OpenAI,"$30.00 / 1M input tokens, $60.00 / 1M output tokens","$30.00 / 1M input tokens, $60.00 / 1M output tokens"
5
+ gpt-3.5-turbo,OpenAI,"$1.00 / 1M input tokens, $2.00 / 1M output tokens","$1.00 / 1M input tokens, $2.00 / 1M output tokens"
6
+ llama-2-70b-chat,Together AI,$0.20 / 1M tokens,$0.20 / 1M tokens
7
+ Mixtral-8x7B-Instruct-v0.1,Together AI,$0.90 / 1M tokens,$0.90 / 1M tokens
8
+ zephyr-7b-beta,Hugging Face Inference Endpoint,$1.30 / hour,$0.00 / 1M tokens
9
+ Mistral-7B-Instruct-v0.2,Hugging Face Inference Endpoint,$1.30 / hour,$0.00 / 1M tokens
10
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,Hugging Face Inference Endpoint,$0.60 / hour,$0.00 / 1M tokens
11
+ gemini-pro,Google VertexAI,"$0.25 / 1M input characters, $0.5 / 1M output characters (60 queries per minute are free)","$0.25 / 1M input tokens, $0.50 / 1M output tokens"
12
+ chat-bison (PaLM 2),Google VertexAI,"$0.25 / 1M input tokens, $0.50 / 1M output tokens","$0.25 / 1M input tokens, $0.50 / 1M output tokens"
13
+ chat-bison-32k (PaLM 2 32K),Google VertexAI,"$0.25 / 1M input tokens, $0.50 / 1M output tokens","$0.25 / 1M input tokens, $0.50 / 1M output tokens"
data/2024-01-26 16:19:55.237955_model_costs.csv ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,provider,provider_pricing,cost_per_token
2
+ gpt-3.5-turbo,OpenAI,"$1 / 1M input tokens, $2 / 1M output tokens","$1 / 1M input tokens, $2 / 1M output tokens"
3
+ gpt-4-turbo,OpenAI,"$10 / 1M input tokens, $30 / 1M output tokens","$10 / 1M input tokens, $30 / 1M output tokens"
4
+ gpt-4,OpenAI,"$30 / 1M input tokens, $60 / 1M output tokens","$30 / 1M input tokens, $60 / 1M output tokens"
5
+ gpt-3.5-turbo,OpenAI,"$1 / 1M input tokens, $2 / 1M output tokens","$1 / 1M input tokens, $2 / 1M output tokens"
6
+ llama-2-70b-chat,Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
7
+ Mixtral-8x7B-Instruct-v0.1,Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
8
+ zephyr-7b-beta,Hugging Face Inference Endpoint,$1.3 / hour,$5.4e-11 / 1M tokens
9
+ Mistral-7B-Instruct-v0.2,Hugging Face Inference Endpoint,$1.3 / hour,$5.3e-11 / 1M tokens
10
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,Hugging Face Inference Endpoint,$0.6 / hour,$1.1e-11 / 1M tokens
11
+ gemini-pro,Google VertexAI,"$0.25 / 1M input characters, $0.5 / 1M output characters (60 queries per minute are free)","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
12
+ chat-bison (PaLM 2),Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
13
+ chat-bison-32k (PaLM 2 32K),Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
data/2024-01-26 16:21:10.212177_model_costs.csv ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,provider,provider_pricing,cost_per_token
2
+ gpt-3.5-turbo,OpenAI,"$1 / 1M input tokens, $2 / 1M output tokens","$1 / 1M input tokens, $2 / 1M output tokens"
3
+ gpt-4-turbo,OpenAI,"$10 / 1M input tokens, $30 / 1M output tokens","$10 / 1M input tokens, $30 / 1M output tokens"
4
+ gpt-4,OpenAI,"$30 / 1M input tokens, $60 / 1M output tokens","$30 / 1M input tokens, $60 / 1M output tokens"
5
+ gpt-3.5-turbo,OpenAI,"$1 / 1M input tokens, $2 / 1M output tokens","$1 / 1M input tokens, $2 / 1M output tokens"
6
+ llama-2-70b-chat,Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
7
+ Mixtral-8x7B-Instruct-v0.1,Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
8
+ zephyr-7b-beta,Hugging Face Inference Endpoint,$1.3 / hour,$54 / 1M tokens
9
+ Mistral-7B-Instruct-v0.2,Hugging Face Inference Endpoint,$1.3 / hour,$53 / 1M tokens
10
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,Hugging Face Inference Endpoint,$0.6 / hour,$11 / 1M tokens
11
+ gemini-pro,Google VertexAI,"$0.25 / 1M input characters, $0.5 / 1M output characters (60 queries per minute are free)","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
12
+ chat-bison (PaLM 2),Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
13
+ chat-bison-32k (PaLM 2 32K),Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
data/2024-01-26 16:21:34.661653_model_costs.csv ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,provider,provider_pricing,cost_per_token
2
+ gpt-3.5-turbo,OpenAI,"$1 / 1M input tokens, $2 / 1M output tokens","$1 / 1M input tokens, $2 / 1M output tokens"
3
+ gpt-4-turbo,OpenAI,"$10 / 1M input tokens, $30 / 1M output tokens","$10 / 1M input tokens, $30 / 1M output tokens"
4
+ gpt-4,OpenAI,"$30 / 1M input tokens, $60 / 1M output tokens","$30 / 1M input tokens, $60 / 1M output tokens"
5
+ gpt-3.5-turbo,OpenAI,"$1 / 1M input tokens, $2 / 1M output tokens","$1 / 1M input tokens, $2 / 1M output tokens"
6
+ llama-2-70b-chat,Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
7
+ Mixtral-8x7B-Instruct-v0.1,Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
8
+ zephyr-7b-beta,Hugging Face Inference Endpoint,$1.3 / hour,$54 / 1M tokens
9
+ Mistral-7B-Instruct-v0.2,Hugging Face Inference Endpoint,$1.3 / hour,$53 / 1M tokens
10
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,Hugging Face Inference Endpoint,$0.6 / hour,$11 / 1M tokens
11
+ gemini-pro,Google VertexAI,"$0.25 / 1M input characters, $0.5 / 1M output characters (60 queries per minute are free)","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
12
+ chat-bison (PaLM 2),Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
13
+ chat-bison-32k (PaLM 2 32K),Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
data/2024-01-26 16:25:47.914140_model_costs.csv ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,provider,provider_pricing,cost_per_token
2
+ gpt-3.5-turbo,OpenAI,"$1 / 1M input tokens, $2 / 1M output tokens","$1 / 1M input tokens, $2 / 1M output tokens"
3
+ gpt-4-turbo,OpenAI,"$10 / 1M input tokens, $30 / 1M output tokens","$10 / 1M input tokens, $30 / 1M output tokens"
4
+ gpt-4,OpenAI,"$30 / 1M input tokens, $60 / 1M output tokens","$30 / 1M input tokens, $60 / 1M output tokens"
5
+ gpt-3.5-turbo,OpenAI,"$1 / 1M input tokens, $2 / 1M output tokens","$1 / 1M input tokens, $2 / 1M output tokens"
6
+ llama-2-70b-chat,Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
7
+ Mixtral-8x7B-Instruct-v0.1,Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
8
+ zephyr-7b-beta,Hugging Face Inference Endpoint,$1.3 / hour,$0.14 / 1M tokens
9
+ Mistral-7B-Instruct-v0.2,Hugging Face Inference Endpoint,$1.3 / hour,$0.14 / 1M tokens
10
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,Hugging Face Inference Endpoint,$0.6 / hour,$0.026 / 1M tokens
11
+ gemini-pro,Google VertexAI,"$0.25 / 1M input characters, $0.5 / 1M output characters (60 queries per minute are free)","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
12
+ chat-bison (PaLM 2),Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
13
+ chat-bison-32k (PaLM 2 32K),Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
data/2024-01-26 16:32:54.481637_model_costs.csv ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,provider,cost_per_token,provider_pricing
2
+ gpt-3.5-turbo,OpenAI,"$1 / 1M input tokens, $2 / 1M output tokens","$1 / 1M input tokens, $2 / 1M output tokens"
3
+ gpt-4-turbo,OpenAI,"$10 / 1M input tokens, $30 / 1M output tokens","$10 / 1M input tokens, $30 / 1M output tokens"
4
+ gpt-4,OpenAI,"$30 / 1M input tokens, $60 / 1M output tokens","$30 / 1M input tokens, $60 / 1M output tokens"
5
+ gpt-3.5-turbo,OpenAI,"$1 / 1M input tokens, $2 / 1M output tokens","$1 / 1M input tokens, $2 / 1M output tokens"
6
+ llama-2-70b-chat,Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
7
+ Mixtral-8x7B-Instruct-v0.1,Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
8
+ zephyr-7b-beta,Hugging Face Inference Endpoint,$0.14 / 1M tokens,$1.3 / hour
9
+ Mistral-7B-Instruct-v0.2,Hugging Face Inference Endpoint,$0.14 / 1M tokens,$1.3 / hour
10
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,Hugging Face Inference Endpoint,$0.026 / 1M tokens,$0.6 / hour
11
+ gemini-pro,Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input characters, $0.5 / 1M output characters (60 queries per minute are free)"
12
+ chat-bison (PaLM 2),Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
13
+ chat-bison-32k (PaLM 2 32K),Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
data/2024-01-26 16:43:36.843194_general_plot.csv ADDED
@@ -0,0 +1,398 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ path,plot_object,description,comment,plot_json
2
+ ./html/plots/response_times.html,"Figure({
3
+ 'data': [{'alignmentgroup': 'True',
4
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
5
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
6
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
7
+ 'name': 'Mistral-7B-Instruct-v0.2',
8
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
9
+ 'orientation': 'v',
10
+ 'showlegend': True,
11
+ 'textposition': 'auto',
12
+ 'type': 'bar',
13
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
+ 'xaxis': 'x',
15
+ 'y': array([3.17454003]),
16
+ 'yaxis': 'y'},
17
+ {'alignmentgroup': 'True',
18
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
19
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
20
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
21
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
22
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
23
+ 'orientation': 'v',
24
+ 'showlegend': True,
25
+ 'textposition': 'auto',
26
+ 'type': 'bar',
27
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
+ 'xaxis': 'x',
29
+ 'y': array([7.14219763]),
30
+ 'yaxis': 'y'},
31
+ {'alignmentgroup': 'True',
32
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
33
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
34
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
35
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
36
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
37
+ 'orientation': 'v',
38
+ 'showlegend': True,
39
+ 'textposition': 'auto',
40
+ 'type': 'bar',
41
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
+ 'xaxis': 'x',
43
+ 'y': array([1.29026454]),
44
+ 'yaxis': 'y'},
45
+ {'alignmentgroup': 'True',
46
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
47
+ 'legendgroup': 'chat-bison',
48
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
+ 'name': 'chat-bison',
50
+ 'offsetgroup': 'chat-bison',
51
+ 'orientation': 'v',
52
+ 'showlegend': True,
53
+ 'textposition': 'auto',
54
+ 'type': 'bar',
55
+ 'x': array(['chat-bison'], dtype=object),
56
+ 'xaxis': 'x',
57
+ 'y': array([3.89024363]),
58
+ 'yaxis': 'y'},
59
+ {'alignmentgroup': 'True',
60
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
61
+ 'legendgroup': 'chat-bison-32k',
62
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
+ 'name': 'chat-bison-32k',
64
+ 'offsetgroup': 'chat-bison-32k',
65
+ 'orientation': 'v',
66
+ 'showlegend': True,
67
+ 'textposition': 'auto',
68
+ 'type': 'bar',
69
+ 'x': array(['chat-bison-32k'], dtype=object),
70
+ 'xaxis': 'x',
71
+ 'y': array([4.12817777]),
72
+ 'yaxis': 'y'},
73
+ {'alignmentgroup': 'True',
74
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
75
+ 'legendgroup': 'gemini-pro',
76
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
+ 'name': 'gemini-pro',
78
+ 'offsetgroup': 'gemini-pro',
79
+ 'orientation': 'v',
80
+ 'showlegend': True,
81
+ 'textposition': 'auto',
82
+ 'type': 'bar',
83
+ 'x': array(['gemini-pro'], dtype=object),
84
+ 'xaxis': 'x',
85
+ 'y': array([4.72138064]),
86
+ 'yaxis': 'y'},
87
+ {'alignmentgroup': 'True',
88
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
89
+ 'legendgroup': 'gpt-3.5-turbo',
90
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
+ 'name': 'gpt-3.5-turbo',
92
+ 'offsetgroup': 'gpt-3.5-turbo',
93
+ 'orientation': 'v',
94
+ 'showlegend': True,
95
+ 'textposition': 'auto',
96
+ 'type': 'bar',
97
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
98
+ 'xaxis': 'x',
99
+ 'y': array([5.28237349]),
100
+ 'yaxis': 'y'},
101
+ {'alignmentgroup': 'True',
102
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
103
+ 'legendgroup': 'gpt-4',
104
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
105
+ 'name': 'gpt-4',
106
+ 'offsetgroup': 'gpt-4',
107
+ 'orientation': 'v',
108
+ 'showlegend': True,
109
+ 'textposition': 'auto',
110
+ 'type': 'bar',
111
+ 'x': array(['gpt-4'], dtype=object),
112
+ 'xaxis': 'x',
113
+ 'y': array([15.52184566]),
114
+ 'yaxis': 'y'},
115
+ {'alignmentgroup': 'True',
116
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
117
+ 'legendgroup': 'gpt-4-turbo',
118
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
119
+ 'name': 'gpt-4-turbo',
120
+ 'offsetgroup': 'gpt-4-turbo',
121
+ 'orientation': 'v',
122
+ 'showlegend': True,
123
+ 'textposition': 'auto',
124
+ 'type': 'bar',
125
+ 'x': array(['gpt-4-turbo'], dtype=object),
126
+ 'xaxis': 'x',
127
+ 'y': array([14.00852903]),
128
+ 'yaxis': 'y'},
129
+ {'alignmentgroup': 'True',
130
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
131
+ 'legendgroup': 'llama-2-70b-chat',
132
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
133
+ 'name': 'llama-2-70b-chat',
134
+ 'offsetgroup': 'llama-2-70b-chat',
135
+ 'orientation': 'v',
136
+ 'showlegend': True,
137
+ 'textposition': 'auto',
138
+ 'type': 'bar',
139
+ 'x': array(['llama-2-70b-chat'], dtype=object),
140
+ 'xaxis': 'x',
141
+ 'y': array([6.0658799]),
142
+ 'yaxis': 'y'},
143
+ {'alignmentgroup': 'True',
144
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
145
+ 'legendgroup': 'zephyr-7b-beta',
146
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
147
+ 'name': 'zephyr-7b-beta',
148
+ 'offsetgroup': 'zephyr-7b-beta',
149
+ 'orientation': 'v',
150
+ 'showlegend': True,
151
+ 'textposition': 'auto',
152
+ 'type': 'bar',
153
+ 'x': array(['zephyr-7b-beta'], dtype=object),
154
+ 'xaxis': 'x',
155
+ 'y': array([3.23879932]),
156
+ 'yaxis': 'y'}],
157
+ 'layout': {'barmode': 'relative',
158
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
159
+ 'template': '...',
160
+ 'title': {'text': 'Model endpoints response times'},
161
+ 'xaxis': {'anchor': 'y',
162
+ 'categoryarray': [Mistral-7B-Instruct-v0.2,
163
+ Mixtral-8x7B-Instruct-v0.1,
164
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
165
+ chat-bison, chat-bison-32k, gemini-pro,
166
+ gpt-3.5-turbo, gpt-4, gpt-4-turbo,
167
+ llama-2-70b-chat, zephyr-7b-beta],
168
+ 'categoryorder': 'array',
169
+ 'domain': [0.0, 1.0],
170
+ 'title': {'text': 'Model'}},
171
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution time (s)'}}}
172
+ })",Model endpoints response times,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[3.174540030956268],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[7.142197625471814],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.2902645373344421],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[3.890243631601334],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[4.128177767992019],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[4.72138064004937],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[5.282373493889353],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[15.5218456586202],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[14.008529031276703],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[6.06587989590749],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[3.2387993240356447],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3
786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidi
ty"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ti
cks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line""
:{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison"",""chat-bison-32k"",""gemini-pro"",""gpt-3.5-turbo"",""gpt-4"",""gpt-4-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution time (s)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model endpoints response times""},""barmode"":""relative""}}"
173
+ ./html/plots/execution_costs.html,"Figure({
174
+ 'data': [{'alignmentgroup': 'True',
175
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
176
+ 'legendgroup': 'gpt-3.5-turbo',
177
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
178
+ 'name': 'gpt-3.5-turbo',
179
+ 'offsetgroup': 'gpt-3.5-turbo',
180
+ 'orientation': 'v',
181
+ 'showlegend': True,
182
+ 'textposition': 'auto',
183
+ 'type': 'bar',
184
+ 'x': array(['gpt-3.5-turbo', 'gpt-3.5-turbo'], dtype=object),
185
+ 'xaxis': 'x',
186
+ 'y': array([0.002619, 0.002619]),
187
+ 'yaxis': 'y'},
188
+ {'alignmentgroup': 'True',
189
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
190
+ 'legendgroup': 'gpt-4-turbo',
191
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
192
+ 'name': 'gpt-4-turbo',
193
+ 'offsetgroup': 'gpt-4-turbo',
194
+ 'orientation': 'v',
195
+ 'showlegend': True,
196
+ 'textposition': 'auto',
197
+ 'type': 'bar',
198
+ 'x': array(['gpt-4-turbo'], dtype=object),
199
+ 'xaxis': 'x',
200
+ 'y': array([0.19886]),
201
+ 'yaxis': 'y'},
202
+ {'alignmentgroup': 'True',
203
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
204
+ 'legendgroup': 'gpt-4',
205
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
206
+ 'name': 'gpt-4',
207
+ 'offsetgroup': 'gpt-4',
208
+ 'orientation': 'v',
209
+ 'showlegend': True,
210
+ 'textposition': 'auto',
211
+ 'type': 'bar',
212
+ 'x': array(['gpt-4'], dtype=object),
213
+ 'xaxis': 'x',
214
+ 'y': array([0.54303]),
215
+ 'yaxis': 'y'},
216
+ {'alignmentgroup': 'True',
217
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
218
+ 'legendgroup': 'llama-2-70b-chat',
219
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
220
+ 'name': 'llama-2-70b-chat',
221
+ 'offsetgroup': 'llama-2-70b-chat',
222
+ 'orientation': 'v',
223
+ 'showlegend': True,
224
+ 'textposition': 'auto',
225
+ 'type': 'bar',
226
+ 'x': array(['llama-2-70b-chat'], dtype=object),
227
+ 'xaxis': 'x',
228
+ 'y': array([0.000809]),
229
+ 'yaxis': 'y'},
230
+ {'alignmentgroup': 'True',
231
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
232
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
233
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
234
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
235
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
236
+ 'orientation': 'v',
237
+ 'showlegend': True,
238
+ 'textposition': 'auto',
239
+ 'type': 'bar',
240
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
241
+ 'xaxis': 'x',
242
+ 'y': array([0.0042849]),
243
+ 'yaxis': 'y'},
244
+ {'alignmentgroup': 'True',
245
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
246
+ 'legendgroup': 'zephyr-7b-beta',
247
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
248
+ 'name': 'zephyr-7b-beta',
249
+ 'offsetgroup': 'zephyr-7b-beta',
250
+ 'orientation': 'v',
251
+ 'showlegend': True,
252
+ 'textposition': 'auto',
253
+ 'type': 'bar',
254
+ 'x': array(['zephyr-7b-beta'], dtype=object),
255
+ 'xaxis': 'x',
256
+ 'y': array([0.00255326]),
257
+ 'yaxis': 'y'},
258
+ {'alignmentgroup': 'True',
259
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
260
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
261
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
262
+ 'name': 'Mistral-7B-Instruct-v0.2',
263
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
264
+ 'orientation': 'v',
265
+ 'showlegend': True,
266
+ 'textposition': 'auto',
267
+ 'type': 'bar',
268
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
269
+ 'xaxis': 'x',
270
+ 'y': array([0.00256334]),
271
+ 'yaxis': 'y'},
272
+ {'alignmentgroup': 'True',
273
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
274
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
275
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
276
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
277
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
278
+ 'orientation': 'v',
279
+ 'showlegend': True,
280
+ 'textposition': 'auto',
281
+ 'type': 'bar',
282
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
283
+ 'xaxis': 'x',
284
+ 'y': array([0.00080414]),
285
+ 'yaxis': 'y'},
286
+ {'alignmentgroup': 'True',
287
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
288
+ 'legendgroup': 'gemini-pro',
289
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
290
+ 'name': 'gemini-pro',
291
+ 'offsetgroup': 'gemini-pro',
292
+ 'orientation': 'v',
293
+ 'showlegend': True,
294
+ 'textposition': 'auto',
295
+ 'type': 'bar',
296
+ 'x': array(['gemini-pro'], dtype=object),
297
+ 'xaxis': 'x',
298
+ 'y': array([0.00070525]),
299
+ 'yaxis': 'y'},
300
+ {'alignmentgroup': 'True',
301
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
302
+ 'legendgroup': 'chat-bison (PaLM 2)',
303
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
304
+ 'name': 'chat-bison (PaLM 2)',
305
+ 'offsetgroup': 'chat-bison (PaLM 2)',
306
+ 'orientation': 'v',
307
+ 'showlegend': True,
308
+ 'textposition': 'auto',
309
+ 'type': 'bar',
310
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
311
+ 'xaxis': 'x',
312
+ 'y': array([0.]),
313
+ 'yaxis': 'y'},
314
+ {'alignmentgroup': 'True',
315
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
316
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
317
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
318
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
319
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
320
+ 'orientation': 'v',
321
+ 'showlegend': True,
322
+ 'textposition': 'auto',
323
+ 'type': 'bar',
324
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
325
+ 'xaxis': 'x',
326
+ 'y': array([0.]),
327
+ 'yaxis': 'y'}],
328
+ 'layout': {'barmode': 'relative',
329
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
330
+ 'template': '...',
331
+ 'title': {'text': 'Costs of execution of 39 test queries per model'},
332
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
333
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}}}
334
+ })",Costs of execution of 39 test queries per model,Note that pause and resume time cost was not included in the cost calculation for the models billed hourly. Also although Gemini-Pro model is free for under 60 queries per minute we calculated the full cost for generating the tokens.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo"",""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[0.002619,0.002619],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[0.19885999999999998],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[0.54303],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[0.000809],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[0.0042848999999999995],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[0.0025532607919640012],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[0.0025633392459816404],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[0.0008041446367899577],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[0.0007052499999999999],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 
32K)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlin
ewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapb
ox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2
222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},
""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 39 test queries per model""},""barmode"":""relative""}}"
335
+ ./html/plots/model_sizes.html,"Figure({
336
+ 'data': [{'alignmentgroup': 'True',
337
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
338
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
339
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
340
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
341
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
342
+ 'orientation': 'v',
343
+ 'showlegend': True,
344
+ 'textposition': 'auto',
345
+ 'type': 'bar',
346
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
347
+ 'xaxis': 'x',
348
+ 'y': array([56.]),
349
+ 'yaxis': 'y'},
350
+ {'alignmentgroup': 'True',
351
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
352
+ 'legendgroup': 'zephyr-7b-beta',
353
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
354
+ 'name': 'zephyr-7b-beta',
355
+ 'offsetgroup': 'zephyr-7b-beta',
356
+ 'orientation': 'v',
357
+ 'showlegend': True,
358
+ 'textposition': 'auto',
359
+ 'type': 'bar',
360
+ 'x': array(['zephyr-7b-beta'], dtype=object),
361
+ 'xaxis': 'x',
362
+ 'y': array([7.]),
363
+ 'yaxis': 'y'},
364
+ {'alignmentgroup': 'True',
365
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
366
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
367
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
368
+ 'name': 'Mistral-7B-Instruct-v0.2',
369
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
370
+ 'orientation': 'v',
371
+ 'showlegend': True,
372
+ 'textposition': 'auto',
373
+ 'type': 'bar',
374
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
375
+ 'xaxis': 'x',
376
+ 'y': array([7.]),
377
+ 'yaxis': 'y'},
378
+ {'alignmentgroup': 'True',
379
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
380
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
381
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
382
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
383
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
384
+ 'orientation': 'v',
385
+ 'showlegend': True,
386
+ 'textposition': 'auto',
387
+ 'type': 'bar',
388
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
389
+ 'xaxis': 'x',
390
+ 'y': array([1.1]),
391
+ 'yaxis': 'y'}],
392
+ 'layout': {'barmode': 'relative',
393
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
394
+ 'template': '...',
395
+ 'title': {'text': 'Model sizes in billions of parameters'},
396
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
397
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}}}
398
+ })",Model sizes in billions of parameters,Note that some models have undisclosed sizes.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B 
params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.1],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.
2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}
}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary""
:{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true
,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"
data/2024-01-26 16:44:14.180186_general_plot.csv ADDED
@@ -0,0 +1,398 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ path,plot_object,description,comment,plot_json
2
+ ./html/plots/response_times.html,"Figure({
3
+ 'data': [{'alignmentgroup': 'True',
4
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
5
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
6
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
7
+ 'name': 'Mistral-7B-Instruct-v0.2',
8
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
9
+ 'orientation': 'v',
10
+ 'showlegend': True,
11
+ 'textposition': 'auto',
12
+ 'type': 'bar',
13
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
+ 'xaxis': 'x',
15
+ 'y': array([3.17454003]),
16
+ 'yaxis': 'y'},
17
+ {'alignmentgroup': 'True',
18
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
19
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
20
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
21
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
22
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
23
+ 'orientation': 'v',
24
+ 'showlegend': True,
25
+ 'textposition': 'auto',
26
+ 'type': 'bar',
27
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
+ 'xaxis': 'x',
29
+ 'y': array([7.14219763]),
30
+ 'yaxis': 'y'},
31
+ {'alignmentgroup': 'True',
32
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
33
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
34
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
35
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
36
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
37
+ 'orientation': 'v',
38
+ 'showlegend': True,
39
+ 'textposition': 'auto',
40
+ 'type': 'bar',
41
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
+ 'xaxis': 'x',
43
+ 'y': array([1.29026454]),
44
+ 'yaxis': 'y'},
45
+ {'alignmentgroup': 'True',
46
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
47
+ 'legendgroup': 'chat-bison',
48
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
+ 'name': 'chat-bison',
50
+ 'offsetgroup': 'chat-bison',
51
+ 'orientation': 'v',
52
+ 'showlegend': True,
53
+ 'textposition': 'auto',
54
+ 'type': 'bar',
55
+ 'x': array(['chat-bison'], dtype=object),
56
+ 'xaxis': 'x',
57
+ 'y': array([3.89024363]),
58
+ 'yaxis': 'y'},
59
+ {'alignmentgroup': 'True',
60
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
61
+ 'legendgroup': 'chat-bison-32k',
62
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
+ 'name': 'chat-bison-32k',
64
+ 'offsetgroup': 'chat-bison-32k',
65
+ 'orientation': 'v',
66
+ 'showlegend': True,
67
+ 'textposition': 'auto',
68
+ 'type': 'bar',
69
+ 'x': array(['chat-bison-32k'], dtype=object),
70
+ 'xaxis': 'x',
71
+ 'y': array([4.12817777]),
72
+ 'yaxis': 'y'},
73
+ {'alignmentgroup': 'True',
74
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
75
+ 'legendgroup': 'gemini-pro',
76
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
+ 'name': 'gemini-pro',
78
+ 'offsetgroup': 'gemini-pro',
79
+ 'orientation': 'v',
80
+ 'showlegend': True,
81
+ 'textposition': 'auto',
82
+ 'type': 'bar',
83
+ 'x': array(['gemini-pro'], dtype=object),
84
+ 'xaxis': 'x',
85
+ 'y': array([4.72138064]),
86
+ 'yaxis': 'y'},
87
+ {'alignmentgroup': 'True',
88
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
89
+ 'legendgroup': 'gpt-3.5-turbo',
90
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
+ 'name': 'gpt-3.5-turbo',
92
+ 'offsetgroup': 'gpt-3.5-turbo',
93
+ 'orientation': 'v',
94
+ 'showlegend': True,
95
+ 'textposition': 'auto',
96
+ 'type': 'bar',
97
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
98
+ 'xaxis': 'x',
99
+ 'y': array([5.28237349]),
100
+ 'yaxis': 'y'},
101
+ {'alignmentgroup': 'True',
102
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
103
+ 'legendgroup': 'gpt-4',
104
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
105
+ 'name': 'gpt-4',
106
+ 'offsetgroup': 'gpt-4',
107
+ 'orientation': 'v',
108
+ 'showlegend': True,
109
+ 'textposition': 'auto',
110
+ 'type': 'bar',
111
+ 'x': array(['gpt-4'], dtype=object),
112
+ 'xaxis': 'x',
113
+ 'y': array([15.52184566]),
114
+ 'yaxis': 'y'},
115
+ {'alignmentgroup': 'True',
116
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
117
+ 'legendgroup': 'gpt-4-turbo',
118
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
119
+ 'name': 'gpt-4-turbo',
120
+ 'offsetgroup': 'gpt-4-turbo',
121
+ 'orientation': 'v',
122
+ 'showlegend': True,
123
+ 'textposition': 'auto',
124
+ 'type': 'bar',
125
+ 'x': array(['gpt-4-turbo'], dtype=object),
126
+ 'xaxis': 'x',
127
+ 'y': array([14.00852903]),
128
+ 'yaxis': 'y'},
129
+ {'alignmentgroup': 'True',
130
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
131
+ 'legendgroup': 'llama-2-70b-chat',
132
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
133
+ 'name': 'llama-2-70b-chat',
134
+ 'offsetgroup': 'llama-2-70b-chat',
135
+ 'orientation': 'v',
136
+ 'showlegend': True,
137
+ 'textposition': 'auto',
138
+ 'type': 'bar',
139
+ 'x': array(['llama-2-70b-chat'], dtype=object),
140
+ 'xaxis': 'x',
141
+ 'y': array([6.0658799]),
142
+ 'yaxis': 'y'},
143
+ {'alignmentgroup': 'True',
144
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
145
+ 'legendgroup': 'zephyr-7b-beta',
146
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
147
+ 'name': 'zephyr-7b-beta',
148
+ 'offsetgroup': 'zephyr-7b-beta',
149
+ 'orientation': 'v',
150
+ 'showlegend': True,
151
+ 'textposition': 'auto',
152
+ 'type': 'bar',
153
+ 'x': array(['zephyr-7b-beta'], dtype=object),
154
+ 'xaxis': 'x',
155
+ 'y': array([3.23879932]),
156
+ 'yaxis': 'y'}],
157
+ 'layout': {'barmode': 'relative',
158
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
159
+ 'template': '...',
160
+ 'title': {'text': 'Model endpoints response times'},
161
+ 'xaxis': {'anchor': 'y',
162
+ 'categoryarray': [Mistral-7B-Instruct-v0.2,
163
+ Mixtral-8x7B-Instruct-v0.1,
164
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
165
+ chat-bison, chat-bison-32k, gemini-pro,
166
+ gpt-3.5-turbo, gpt-4, gpt-4-turbo,
167
+ llama-2-70b-chat, zephyr-7b-beta],
168
+ 'categoryorder': 'array',
169
+ 'domain': [0.0, 1.0],
170
+ 'title': {'text': 'Model'}},
171
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution time (s)'}}}
172
+ })",Model endpoints response times,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[3.174540030956268],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[7.142197625471814],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.2902645373344421],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[3.890243631601334],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[4.128177767992019],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[4.72138064004937],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[5.282373493889353],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[15.5218456586202],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[14.008529031276703],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[6.06587989590749],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[3.2387993240356447],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3
786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidi
ty"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ti
cks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line""
:{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison"",""chat-bison-32k"",""gemini-pro"",""gpt-3.5-turbo"",""gpt-4"",""gpt-4-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution time (s)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model endpoints response times""},""barmode"":""relative""}}"
173
+ ./html/plots/execution_costs.html,"Figure({
174
+ 'data': [{'alignmentgroup': 'True',
175
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
176
+ 'legendgroup': 'gpt-3.5-turbo',
177
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
178
+ 'name': 'gpt-3.5-turbo',
179
+ 'offsetgroup': 'gpt-3.5-turbo',
180
+ 'orientation': 'v',
181
+ 'showlegend': True,
182
+ 'textposition': 'auto',
183
+ 'type': 'bar',
184
+ 'x': array(['gpt-3.5-turbo', 'gpt-3.5-turbo'], dtype=object),
185
+ 'xaxis': 'x',
186
+ 'y': array([0.020994, 0.020994]),
187
+ 'yaxis': 'y'},
188
+ {'alignmentgroup': 'True',
189
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
190
+ 'legendgroup': 'gpt-4-turbo',
191
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
192
+ 'name': 'gpt-4-turbo',
193
+ 'offsetgroup': 'gpt-4-turbo',
194
+ 'orientation': 'v',
195
+ 'showlegend': True,
196
+ 'textposition': 'auto',
197
+ 'type': 'bar',
198
+ 'x': array(['gpt-4-turbo'], dtype=object),
199
+ 'xaxis': 'x',
200
+ 'y': array([0.02967]),
201
+ 'yaxis': 'y'},
202
+ {'alignmentgroup': 'True',
203
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
204
+ 'legendgroup': 'gpt-4',
205
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
206
+ 'name': 'gpt-4',
207
+ 'offsetgroup': 'gpt-4',
208
+ 'orientation': 'v',
209
+ 'showlegend': True,
210
+ 'textposition': 'auto',
211
+ 'type': 'bar',
212
+ 'x': array(['gpt-4'], dtype=object),
213
+ 'xaxis': 'x',
214
+ 'y': array([0.07839]),
215
+ 'yaxis': 'y'},
216
+ {'alignmentgroup': 'True',
217
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
218
+ 'legendgroup': 'llama-2-70b-chat',
219
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
220
+ 'name': 'llama-2-70b-chat',
221
+ 'offsetgroup': 'llama-2-70b-chat',
222
+ 'orientation': 'v',
223
+ 'showlegend': True,
224
+ 'textposition': 'auto',
225
+ 'type': 'bar',
226
+ 'x': array(['llama-2-70b-chat'], dtype=object),
227
+ 'xaxis': 'x',
228
+ 'y': array([0.0039636]),
229
+ 'yaxis': 'y'},
230
+ {'alignmentgroup': 'True',
231
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
232
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
233
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
234
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
235
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
236
+ 'orientation': 'v',
237
+ 'showlegend': True,
238
+ 'textposition': 'auto',
239
+ 'type': 'bar',
240
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
241
+ 'xaxis': 'x',
242
+ 'y': array([0.0161523]),
243
+ 'yaxis': 'y'},
244
+ {'alignmentgroup': 'True',
245
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
246
+ 'legendgroup': 'zephyr-7b-beta',
247
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
248
+ 'name': 'zephyr-7b-beta',
249
+ 'offsetgroup': 'zephyr-7b-beta',
250
+ 'orientation': 'v',
251
+ 'showlegend': True,
252
+ 'textposition': 'auto',
253
+ 'type': 'bar',
254
+ 'x': array(['zephyr-7b-beta'], dtype=object),
255
+ 'xaxis': 'x',
256
+ 'y': array([0.00550208]),
257
+ 'yaxis': 'y'},
258
+ {'alignmentgroup': 'True',
259
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
260
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
261
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
262
+ 'name': 'Mistral-7B-Instruct-v0.2',
263
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
264
+ 'orientation': 'v',
265
+ 'showlegend': True,
266
+ 'textposition': 'auto',
267
+ 'type': 'bar',
268
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
269
+ 'xaxis': 'x',
270
+ 'y': array([0.00202543]),
271
+ 'yaxis': 'y'},
272
+ {'alignmentgroup': 'True',
273
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
274
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
275
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
276
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
277
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
278
+ 'orientation': 'v',
279
+ 'showlegend': True,
280
+ 'textposition': 'auto',
281
+ 'type': 'bar',
282
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
283
+ 'xaxis': 'x',
284
+ 'y': array([0.00046687]),
285
+ 'yaxis': 'y'},
286
+ {'alignmentgroup': 'True',
287
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
288
+ 'legendgroup': 'gemini-pro',
289
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
290
+ 'name': 'gemini-pro',
291
+ 'offsetgroup': 'gemini-pro',
292
+ 'orientation': 'v',
293
+ 'showlegend': True,
294
+ 'textposition': 'auto',
295
+ 'type': 'bar',
296
+ 'x': array(['gemini-pro'], dtype=object),
297
+ 'xaxis': 'x',
298
+ 'y': array([0.005052]),
299
+ 'yaxis': 'y'},
300
+ {'alignmentgroup': 'True',
301
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
302
+ 'legendgroup': 'chat-bison (PaLM 2)',
303
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
304
+ 'name': 'chat-bison (PaLM 2)',
305
+ 'offsetgroup': 'chat-bison (PaLM 2)',
306
+ 'orientation': 'v',
307
+ 'showlegend': True,
308
+ 'textposition': 'auto',
309
+ 'type': 'bar',
310
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
311
+ 'xaxis': 'x',
312
+ 'y': array([0.]),
313
+ 'yaxis': 'y'},
314
+ {'alignmentgroup': 'True',
315
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
316
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
317
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
318
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
319
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
320
+ 'orientation': 'v',
321
+ 'showlegend': True,
322
+ 'textposition': 'auto',
323
+ 'type': 'bar',
324
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
325
+ 'xaxis': 'x',
326
+ 'y': array([0.]),
327
+ 'yaxis': 'y'}],
328
+ 'layout': {'barmode': 'relative',
329
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
330
+ 'template': '...',
331
+ 'title': {'text': 'Costs of execution of 39 test queries per model'},
332
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
333
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}}}
334
+ })",Costs of execution of 39 test queries per model,Note that pause and resume time cost was not included in the cost calculation for the models billed hourly. Also although Gemini-Pro model is free for under 60 queries per minute we calculated the full cost for generating the tokens.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo"",""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[0.020994000000000002,0.020994000000000002],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[0.029670000000000002],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[0.07839],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[0.0039636],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[0.016152299999999998],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[0.005502075092660056],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[0.002025430454148187],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[0.0004668651938438415],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[0.005052],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 
32K)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlin
ewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapb
ox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2
222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},
""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 39 test queries per model""},""barmode"":""relative""}}"
335
+ ./html/plots/model_sizes.html,"Figure({
336
+ 'data': [{'alignmentgroup': 'True',
337
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
338
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
339
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
340
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
341
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
342
+ 'orientation': 'v',
343
+ 'showlegend': True,
344
+ 'textposition': 'auto',
345
+ 'type': 'bar',
346
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
347
+ 'xaxis': 'x',
348
+ 'y': array([56.]),
349
+ 'yaxis': 'y'},
350
+ {'alignmentgroup': 'True',
351
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
352
+ 'legendgroup': 'zephyr-7b-beta',
353
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
354
+ 'name': 'zephyr-7b-beta',
355
+ 'offsetgroup': 'zephyr-7b-beta',
356
+ 'orientation': 'v',
357
+ 'showlegend': True,
358
+ 'textposition': 'auto',
359
+ 'type': 'bar',
360
+ 'x': array(['zephyr-7b-beta'], dtype=object),
361
+ 'xaxis': 'x',
362
+ 'y': array([7.]),
363
+ 'yaxis': 'y'},
364
+ {'alignmentgroup': 'True',
365
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
366
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
367
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
368
+ 'name': 'Mistral-7B-Instruct-v0.2',
369
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
370
+ 'orientation': 'v',
371
+ 'showlegend': True,
372
+ 'textposition': 'auto',
373
+ 'type': 'bar',
374
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
375
+ 'xaxis': 'x',
376
+ 'y': array([7.]),
377
+ 'yaxis': 'y'},
378
+ {'alignmentgroup': 'True',
379
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
380
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
381
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
382
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
383
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
384
+ 'orientation': 'v',
385
+ 'showlegend': True,
386
+ 'textposition': 'auto',
387
+ 'type': 'bar',
388
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
389
+ 'xaxis': 'x',
390
+ 'y': array([1.1]),
391
+ 'yaxis': 'y'}],
392
+ 'layout': {'barmode': 'relative',
393
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
394
+ 'template': '...',
395
+ 'title': {'text': 'Model sizes in billions of parameters'},
396
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
397
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}}}
398
+ })",Model sizes in billions of parameters,Note that some models have undisclosed sizes.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B 
params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.1],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.
2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}
}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary""
:{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true
,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"
data/2024-01-30 13:08:12.199559_general_plot.csv ADDED
@@ -0,0 +1,398 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ path,plot_object,description,comment,plot_json
2
+ ./html/plots/response_times.html,"Figure({
3
+ 'data': [{'alignmentgroup': 'True',
4
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
5
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
6
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
7
+ 'name': 'Mistral-7B-Instruct-v0.2',
8
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
9
+ 'orientation': 'v',
10
+ 'showlegend': True,
11
+ 'textposition': 'auto',
12
+ 'type': 'bar',
13
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
+ 'xaxis': 'x',
15
+ 'y': array([3.17454003]),
16
+ 'yaxis': 'y'},
17
+ {'alignmentgroup': 'True',
18
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
19
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
20
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
21
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
22
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
23
+ 'orientation': 'v',
24
+ 'showlegend': True,
25
+ 'textposition': 'auto',
26
+ 'type': 'bar',
27
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
+ 'xaxis': 'x',
29
+ 'y': array([7.14219763]),
30
+ 'yaxis': 'y'},
31
+ {'alignmentgroup': 'True',
32
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
33
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
34
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
35
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
36
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
37
+ 'orientation': 'v',
38
+ 'showlegend': True,
39
+ 'textposition': 'auto',
40
+ 'type': 'bar',
41
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
+ 'xaxis': 'x',
43
+ 'y': array([1.29026454]),
44
+ 'yaxis': 'y'},
45
+ {'alignmentgroup': 'True',
46
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
47
+ 'legendgroup': 'chat-bison',
48
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
+ 'name': 'chat-bison',
50
+ 'offsetgroup': 'chat-bison',
51
+ 'orientation': 'v',
52
+ 'showlegend': True,
53
+ 'textposition': 'auto',
54
+ 'type': 'bar',
55
+ 'x': array(['chat-bison'], dtype=object),
56
+ 'xaxis': 'x',
57
+ 'y': array([3.89024363]),
58
+ 'yaxis': 'y'},
59
+ {'alignmentgroup': 'True',
60
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
61
+ 'legendgroup': 'chat-bison-32k',
62
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
+ 'name': 'chat-bison-32k',
64
+ 'offsetgroup': 'chat-bison-32k',
65
+ 'orientation': 'v',
66
+ 'showlegend': True,
67
+ 'textposition': 'auto',
68
+ 'type': 'bar',
69
+ 'x': array(['chat-bison-32k'], dtype=object),
70
+ 'xaxis': 'x',
71
+ 'y': array([4.12817777]),
72
+ 'yaxis': 'y'},
73
+ {'alignmentgroup': 'True',
74
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
75
+ 'legendgroup': 'gemini-pro',
76
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
+ 'name': 'gemini-pro',
78
+ 'offsetgroup': 'gemini-pro',
79
+ 'orientation': 'v',
80
+ 'showlegend': True,
81
+ 'textposition': 'auto',
82
+ 'type': 'bar',
83
+ 'x': array(['gemini-pro'], dtype=object),
84
+ 'xaxis': 'x',
85
+ 'y': array([4.72138064]),
86
+ 'yaxis': 'y'},
87
+ {'alignmentgroup': 'True',
88
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
89
+ 'legendgroup': 'gpt-3.5-turbo',
90
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
+ 'name': 'gpt-3.5-turbo',
92
+ 'offsetgroup': 'gpt-3.5-turbo',
93
+ 'orientation': 'v',
94
+ 'showlegend': True,
95
+ 'textposition': 'auto',
96
+ 'type': 'bar',
97
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
98
+ 'xaxis': 'x',
99
+ 'y': array([5.28237349]),
100
+ 'yaxis': 'y'},
101
+ {'alignmentgroup': 'True',
102
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
103
+ 'legendgroup': 'gpt-4',
104
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
105
+ 'name': 'gpt-4',
106
+ 'offsetgroup': 'gpt-4',
107
+ 'orientation': 'v',
108
+ 'showlegend': True,
109
+ 'textposition': 'auto',
110
+ 'type': 'bar',
111
+ 'x': array(['gpt-4'], dtype=object),
112
+ 'xaxis': 'x',
113
+ 'y': array([15.52184566]),
114
+ 'yaxis': 'y'},
115
+ {'alignmentgroup': 'True',
116
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
117
+ 'legendgroup': 'gpt-4-turbo',
118
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
119
+ 'name': 'gpt-4-turbo',
120
+ 'offsetgroup': 'gpt-4-turbo',
121
+ 'orientation': 'v',
122
+ 'showlegend': True,
123
+ 'textposition': 'auto',
124
+ 'type': 'bar',
125
+ 'x': array(['gpt-4-turbo'], dtype=object),
126
+ 'xaxis': 'x',
127
+ 'y': array([14.00852903]),
128
+ 'yaxis': 'y'},
129
+ {'alignmentgroup': 'True',
130
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
131
+ 'legendgroup': 'llama-2-70b-chat',
132
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
133
+ 'name': 'llama-2-70b-chat',
134
+ 'offsetgroup': 'llama-2-70b-chat',
135
+ 'orientation': 'v',
136
+ 'showlegend': True,
137
+ 'textposition': 'auto',
138
+ 'type': 'bar',
139
+ 'x': array(['llama-2-70b-chat'], dtype=object),
140
+ 'xaxis': 'x',
141
+ 'y': array([6.0658799]),
142
+ 'yaxis': 'y'},
143
+ {'alignmentgroup': 'True',
144
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
145
+ 'legendgroup': 'zephyr-7b-beta',
146
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
147
+ 'name': 'zephyr-7b-beta',
148
+ 'offsetgroup': 'zephyr-7b-beta',
149
+ 'orientation': 'v',
150
+ 'showlegend': True,
151
+ 'textposition': 'auto',
152
+ 'type': 'bar',
153
+ 'x': array(['zephyr-7b-beta'], dtype=object),
154
+ 'xaxis': 'x',
155
+ 'y': array([3.23879932]),
156
+ 'yaxis': 'y'}],
157
+ 'layout': {'barmode': 'relative',
158
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
159
+ 'template': '...',
160
+ 'title': {'text': 'Model endpoints response times'},
161
+ 'xaxis': {'anchor': 'y',
162
+ 'categoryarray': [Mistral-7B-Instruct-v0.2,
163
+ Mixtral-8x7B-Instruct-v0.1,
164
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
165
+ chat-bison, chat-bison-32k, gemini-pro,
166
+ gpt-3.5-turbo, gpt-4, gpt-4-turbo,
167
+ llama-2-70b-chat, zephyr-7b-beta],
168
+ 'categoryorder': 'array',
169
+ 'domain': [0.0, 1.0],
170
+ 'title': {'text': 'Model'}},
171
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution time (s)'}}}
172
+ })",Model endpoints response times,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[3.174540030956268],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[7.142197625471814],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.2902645373344421],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[3.890243631601334],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[4.128177767992019],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[4.72138064004937],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[5.282373493889353],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[15.5218456586202],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[14.008529031276703],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[6.06587989590749],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[3.2387993240356447],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3
786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidi
ty"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ti
cks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line""
:{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison"",""chat-bison-32k"",""gemini-pro"",""gpt-3.5-turbo"",""gpt-4"",""gpt-4-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution time (s)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model endpoints response times""},""barmode"":""relative""}}"
173
+ ./html/plots/execution_costs.html,"Figure({
174
+ 'data': [{'alignmentgroup': 'True',
175
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
176
+ 'legendgroup': 'gpt-3.5-turbo',
177
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
178
+ 'name': 'gpt-3.5-turbo',
179
+ 'offsetgroup': 'gpt-3.5-turbo',
180
+ 'orientation': 'v',
181
+ 'showlegend': True,
182
+ 'textposition': 'auto',
183
+ 'type': 'bar',
184
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
185
+ 'xaxis': 'x',
186
+ 'y': array([0.471009]),
187
+ 'yaxis': 'y'},
188
+ {'alignmentgroup': 'True',
189
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
190
+ 'legendgroup': 'gpt-4-turbo',
191
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
192
+ 'name': 'gpt-4-turbo',
193
+ 'offsetgroup': 'gpt-4-turbo',
194
+ 'orientation': 'v',
195
+ 'showlegend': True,
196
+ 'textposition': 'auto',
197
+ 'type': 'bar',
198
+ 'x': array(['gpt-4-turbo'], dtype=object),
199
+ 'xaxis': 'x',
200
+ 'y': array([4.49821]),
201
+ 'yaxis': 'y'},
202
+ {'alignmentgroup': 'True',
203
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
204
+ 'legendgroup': 'gpt-4',
205
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
206
+ 'name': 'gpt-4',
207
+ 'offsetgroup': 'gpt-4',
208
+ 'orientation': 'v',
209
+ 'showlegend': True,
210
+ 'textposition': 'auto',
211
+ 'type': 'bar',
212
+ 'x': array(['gpt-4'], dtype=object),
213
+ 'xaxis': 'x',
214
+ 'y': array([11.69823]),
215
+ 'yaxis': 'y'},
216
+ {'alignmentgroup': 'True',
217
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
218
+ 'legendgroup': 'llama-2-70b-chat',
219
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
220
+ 'name': 'llama-2-70b-chat',
221
+ 'offsetgroup': 'llama-2-70b-chat',
222
+ 'orientation': 'v',
223
+ 'showlegend': True,
224
+ 'textposition': 'auto',
225
+ 'type': 'bar',
226
+ 'x': array(['llama-2-70b-chat'], dtype=object),
227
+ 'xaxis': 'x',
228
+ 'y': array([0.095657]),
229
+ 'yaxis': 'y'},
230
+ {'alignmentgroup': 'True',
231
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
232
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
233
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
234
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
235
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
236
+ 'orientation': 'v',
237
+ 'showlegend': True,
238
+ 'textposition': 'auto',
239
+ 'type': 'bar',
240
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
241
+ 'xaxis': 'x',
242
+ 'y': array([0.3244509]),
243
+ 'yaxis': 'y'},
244
+ {'alignmentgroup': 'True',
245
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
246
+ 'legendgroup': 'zephyr-7b-beta',
247
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
248
+ 'name': 'zephyr-7b-beta',
249
+ 'offsetgroup': 'zephyr-7b-beta',
250
+ 'orientation': 'v',
251
+ 'showlegend': True,
252
+ 'textposition': 'auto',
253
+ 'type': 'bar',
254
+ 'x': array(['zephyr-7b-beta'], dtype=object),
255
+ 'xaxis': 'x',
256
+ 'y': array([0.1279793]),
257
+ 'yaxis': 'y'},
258
+ {'alignmentgroup': 'True',
259
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
260
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
261
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
262
+ 'name': 'Mistral-7B-Instruct-v0.2',
263
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
264
+ 'orientation': 'v',
265
+ 'showlegend': True,
266
+ 'textposition': 'auto',
267
+ 'type': 'bar',
268
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
269
+ 'xaxis': 'x',
270
+ 'y': array([0.05851047]),
271
+ 'yaxis': 'y'},
272
+ {'alignmentgroup': 'True',
273
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
274
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
275
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
276
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
277
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
278
+ 'orientation': 'v',
279
+ 'showlegend': True,
280
+ 'textposition': 'auto',
281
+ 'type': 'bar',
282
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
283
+ 'xaxis': 'x',
284
+ 'y': array([0.01705275]),
285
+ 'yaxis': 'y'},
286
+ {'alignmentgroup': 'True',
287
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
288
+ 'legendgroup': 'gemini-pro',
289
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
290
+ 'name': 'gemini-pro',
291
+ 'offsetgroup': 'gemini-pro',
292
+ 'orientation': 'v',
293
+ 'showlegend': True,
294
+ 'textposition': 'auto',
295
+ 'type': 'bar',
296
+ 'x': array(['gemini-pro'], dtype=object),
297
+ 'xaxis': 'x',
298
+ 'y': array([0.10229025]),
299
+ 'yaxis': 'y'},
300
+ {'alignmentgroup': 'True',
301
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
302
+ 'legendgroup': 'chat-bison (PaLM 2)',
303
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
304
+ 'name': 'chat-bison (PaLM 2)',
305
+ 'offsetgroup': 'chat-bison (PaLM 2)',
306
+ 'orientation': 'v',
307
+ 'showlegend': True,
308
+ 'textposition': 'auto',
309
+ 'type': 'bar',
310
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
311
+ 'xaxis': 'x',
312
+ 'y': array([0.]),
313
+ 'yaxis': 'y'},
314
+ {'alignmentgroup': 'True',
315
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
316
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
317
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
318
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
319
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
320
+ 'orientation': 'v',
321
+ 'showlegend': True,
322
+ 'textposition': 'auto',
323
+ 'type': 'bar',
324
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
325
+ 'xaxis': 'x',
326
+ 'y': array([0.]),
327
+ 'yaxis': 'y'}],
328
+ 'layout': {'barmode': 'relative',
329
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
330
+ 'template': '...',
331
+ 'title': {'text': 'Costs of execution of 780 test queries per model'},
332
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
333
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}}}
334
+ })",Costs of execution of 780 test queries per model,Note that pause and resume time cost was not included in the cost calculation for the models billed hourly. Also although Gemini-Pro model is free for under 60 queries per minute we calculated the full cost for generating the tokens.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[0.47100899999999996],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[4.49821],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[11.698229999999999],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[0.095657],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[0.3244509],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[0.1279792968829473],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[0.05851047111882104],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[0.017052749236424764],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[0.10229025],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 
32K)""],""xaxis"":""x"",""y"":[0.0],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlin
ewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapb
ox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2
222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},
""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 780 test queries per model""},""barmode"":""relative""}}"
335
+ ./html/plots/model_sizes.html,"Figure({
336
+ 'data': [{'alignmentgroup': 'True',
337
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
338
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
339
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
340
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
341
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
342
+ 'orientation': 'v',
343
+ 'showlegend': True,
344
+ 'textposition': 'auto',
345
+ 'type': 'bar',
346
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
347
+ 'xaxis': 'x',
348
+ 'y': array([56.]),
349
+ 'yaxis': 'y'},
350
+ {'alignmentgroup': 'True',
351
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
352
+ 'legendgroup': 'zephyr-7b-beta',
353
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
354
+ 'name': 'zephyr-7b-beta',
355
+ 'offsetgroup': 'zephyr-7b-beta',
356
+ 'orientation': 'v',
357
+ 'showlegend': True,
358
+ 'textposition': 'auto',
359
+ 'type': 'bar',
360
+ 'x': array(['zephyr-7b-beta'], dtype=object),
361
+ 'xaxis': 'x',
362
+ 'y': array([7.]),
363
+ 'yaxis': 'y'},
364
+ {'alignmentgroup': 'True',
365
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
366
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
367
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
368
+ 'name': 'Mistral-7B-Instruct-v0.2',
369
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
370
+ 'orientation': 'v',
371
+ 'showlegend': True,
372
+ 'textposition': 'auto',
373
+ 'type': 'bar',
374
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
375
+ 'xaxis': 'x',
376
+ 'y': array([7.]),
377
+ 'yaxis': 'y'},
378
+ {'alignmentgroup': 'True',
379
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
380
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
381
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
382
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
383
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
384
+ 'orientation': 'v',
385
+ 'showlegend': True,
386
+ 'textposition': 'auto',
387
+ 'type': 'bar',
388
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
389
+ 'xaxis': 'x',
390
+ 'y': array([1.1]),
391
+ 'yaxis': 'y'}],
392
+ 'layout': {'barmode': 'relative',
393
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
394
+ 'template': '...',
395
+ 'title': {'text': 'Model sizes in billions of parameters'},
396
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
397
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}}}
398
+ })",Model sizes in billions of parameters,Note that some models have undisclosed sizes.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B 
params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.1],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.
2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}
}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary""
:{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true
,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"
data/2024-01-30 18:39:54.448407_time_of_day_comparison.csv ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,time_of_day,execution_time,characters_count,words_count
2
+ Mistral-7B-Instruct-v0.2,afternoon,3.023258109887441,172.18333333333334,22.95
3
+ Mistral-7B-Instruct-v0.2,evening,,,
4
+ Mistral-7B-Instruct-v0.2,morning,3.174540030956268,113.0,16.27
5
+ Mixtral-8x7B-Instruct-v0.1,afternoon,7.426922065019608,450.4875,51.85
6
+ Mixtral-8x7B-Instruct-v0.1,morning,7.142197625471814,494.9583333333333,57.74166666666667
7
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,afternoon,1.538642168045044,169.46666666666667,26.083333333333332
8
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,morning,1.2902645373344421,106.18,16.74
9
+ chat-bison,morning,3.890243631601334,398.075,49.0
10
+ chat-bison (PaLM 2),afternoon,3.866238150000572,381.7875,40.3875
11
+ chat-bison-32k,morning,4.128177767992019,389.925,48.025
12
+ chat-bison-32k (PaLM 2 32K),afternoon,4.844334444403648,371.25,38.7375
13
+ gemini-pro,afternoon,3.6972034962972007,352.2,33.9375
14
+ gemini-pro,morning,4.72138064004937,425.09166666666664,49.891666666666666
15
+ gpt-3.5-turbo,afternoon,4.228875203738137,364.92857142857144,36.42857142857143
16
+ gpt-3.5-turbo,evening,4.351089119911194,305.25,28.5
17
+ gpt-3.5-turbo,morning,5.336839800789242,479.2785714285714,53.92142857142857
18
+ gpt-4,afternoon,20.52127287968868,307.175,31.975
19
+ gpt-4,morning,15.5218456586202,389.1875,44.125
20
+ gpt-4-turbo,afternoon,23.51892908215523,396.40833333333336,41.858333333333334
21
+ gpt-4-turbo,morning,14.008529031276703,433.075,49.975
22
+ llama-2-70b-chat,afternoon,4.851686128755895,671.2317073170732,83.5609756097561
23
+ llama-2-70b-chat,evening,5.552149415016174,967.5,141.25
24
+ llama-2-70b-chat,morning,6.175082007679371,662.7416666666667,94.30833333333334
25
+ zephyr-7b-beta,afternoon,3.0400254487991334,163.45,23.8
26
+ zephyr-7b-beta,evening,,,
27
+ zephyr-7b-beta,morning,3.2387993240356447,112.57,17.26
data/2024-01-30 18:40:08.467683_summary.csv ADDED
@@ -0,0 +1,75 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,language,template_name,execution_time,characters_count,words_count,chunk_sizes_mean,chunk_sizes_min,chunk_sizes_max,chunk_generation_times_mean,chunk_generation_times_min,chunk_generation_times_max
2
+ Mistral-7B-Instruct-v0.2,english,call,,,,,,,,,
3
+ Mistral-7B-Instruct-v0.2,english,json,7.318650853633881,222.2,35.95,4.157156220767072,1.0,14.0,0.10865272596910582,0.00024437904357910156,60.7178213596344
4
+ Mistral-7B-Instruct-v0.2,english,markdown,3.4006769716739655,324.0,50.9,4.217377155873739,1.0,16.0,0.03379235289362949,0.020945072174072266,0.25538039207458496
5
+ Mistral-7B-Instruct-v0.2,japanese,call,,,,,,,,,
6
+ Mistral-7B-Instruct-v0.2,japanese,json,2.129413692156474,44.516666666666666,3.1666666666666665,1.338176352705411,1.0,11.0,0.038890062568182934,0.020466089248657227,0.23994874954223633
7
+ Mistral-7B-Instruct-v0.2,japanese,markdown,2.217114305496216,38.9,1.475,1.1035460992907802,1.0,6.0,0.03959447390644263,0.0004932880401611328,0.2205650806427002
8
+ Mixtral-8x7B-Instruct-v0.1,english,call,,,,,,,,,
9
+ Mixtral-8x7B-Instruct-v0.1,english,json,3.2277008444070816,397.18333333333334,61.68333333333333,4.278456014362657,1.0,15.0,0.016790826658800218,0.0002071857452392578,1.011472463607788
10
+ Mixtral-8x7B-Instruct-v0.1,english,markdown,7.234642684459686,565.725,90.475,4.366846777306059,1.0,15.0,0.018897794563767535,0.00021576881408691406,1.7103569507598877
11
+ Mixtral-8x7B-Instruct-v0.1,japanese,call,,,,,,,,,
12
+ Mixtral-8x7B-Instruct-v0.1,japanese,json,8.271932434617428,536.4833333333333,58.78333333333333,2.1412226435175947,1.0,15.0,0.026507280039896726,0.00021338462829589844,76.45081758499146
13
+ Mixtral-8x7B-Instruct-v0.1,japanese,markdown,10.715969985723495,419.625,5.75,1.0792824074074074,1.0,10.0,0.018218461148164892,0.00021529197692871094,2.994176149368286
14
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,call,,,,,,,,,
15
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,json,1.3998499751091003,203.15,34.6,4.120689655172414,1.0,13.0,0.01180358711652775,0.0003421306610107422,0.13397955894470215
16
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,markdown,1.5995279610157014,248.2,41.625,3.9303246239113223,1.0,14.0,0.012339331286348055,0.0003273487091064453,0.15227961540222168
17
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,japanese,call,,,,,,,,,
18
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,japanese,json,1.2796377182006835,59.766666666666666,7.2,1.9966592427616927,1.0,13.0,0.01475177509482029,0.00041413307189941406,0.18952107429504395
19
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,japanese,markdown,1.3147150695323944,80.225,11.25,2.3595588235294116,1.0,13.0,0.013936110629754908,0.0005300045013427734,0.176621675491333
20
+ chat-bison,english,call,,,,,,,,,
21
+ chat-bison,english,json,3.446989095211029,550.05,86.0,89.4390243902439,1.0,138.0,0.4258628240445765,0.0006544589996337891,2.2015340328216553
22
+ chat-bison,japanese,call,,,,,,,,,
23
+ chat-bison,japanese,json,4.333498167991638,246.1,12.0,33.48299319727891,3.0,124.0,0.47770044917152044,0.0005426406860351562,3.5425846576690674
24
+ chat-bison (PaLM 2),english,call,,,,,,,,,
25
+ chat-bison (PaLM 2),english,json,2.9914507985115053,380.9,60.65,81.91397849462365,1.0,135.0,0.46110378285889986,0.0008225440979003906,2.025282144546509
26
+ chat-bison (PaLM 2),english,markdown,3.1855568289756775,480.45,76.6,86.56756756756756,12.0,129.0,0.4221067342672262,0.00087738037109375,2.063969373703003
27
+ chat-bison (PaLM 2),japanese,call,,,,,,,,,
28
+ chat-bison (PaLM 2),japanese,json,3.69934686422348,230.85,10.5,34.714285714285715,6.0,124.0,0.4294193310845167,0.0006532669067382812,2.7724690437316895
29
+ chat-bison (PaLM 2),japanese,markdown,5.588598108291626,434.95,13.8,32.09963099630996,10.0,124.0,0.3500617219073306,0.0005550384521484375,7.114030122756958
30
+ chat-bison-32k,english,call,,,,,,,,,
31
+ chat-bison-32k,english,json,3.74513863325119,538.4,84.25,88.26229508196721,1.0,134.0,0.47832588094179745,0.0006556510925292969,3.0114917755126953
32
+ chat-bison-32k,japanese,call,,,,,,,,,
33
+ chat-bison-32k,japanese,json,4.5112169027328495,241.45,11.8,35.77037037037037,6.0,124.0,0.5467217816246881,0.0005869865417480469,4.387756824493408
34
+ chat-bison-32k (PaLM 2 32K),english,call,,,,,,,,,
35
+ chat-bison-32k (PaLM 2 32K),english,json,2.968719494342804,335.75,53.85,77.183908045977,1.0,133.0,0.4880794711496638,0.0005464553833007812,1.8793001174926758
36
+ chat-bison-32k (PaLM 2 32K),english,markdown,3.229217529296875,429.95,69.35,82.6826923076923,1.0,133.0,0.4584116041660309,0.0005412101745605469,2.0599677562713623
37
+ chat-bison-32k (PaLM 2 32K),japanese,call,,,,,,,,,
38
+ chat-bison-32k (PaLM 2 32K),japanese,json,6.968563377857208,272.85,10.35,34.320754716981135,4.0,124.0,0.7706441234492656,0.0005052089691162109,52.47814655303955
39
+ chat-bison-32k (PaLM 2 32K),japanese,markdown,6.2108373761177065,446.45,21.4,32.118705035971225,5.0,124.0,0.38614349571063367,0.0007460117340087891,7.091885089874268
40
+ gemini-pro,english,call,,,,,,,,,
41
+ gemini-pro,english,json,3.3069549907337534,478.03333333333336,75.23333333333333,178.14906832298138,1.0,988.0,1.107387858147947,0.0006723403930664062,8.669384241104126
42
+ gemini-pro,english,markdown,3.3248310733485864,547.225,90.025,159.77372262773721,12.0,472.0,0.879381437371247,0.0007510185241699219,2.820554733276367
43
+ gemini-pro,japanese,call,,,,,,,,,
44
+ gemini-pro,japanese,json,4.618957793458979,220.95,4.666666666666667,77.52631578947368,4.0,237.0,1.2511649340914006,0.0006062984466552734,5.698127031326294
45
+ gemini-pro,japanese,markdown,6.4115668955971215,383.975,7.675,83.02162162162162,14.0,266.0,1.1660070625511376,0.0006639957427978516,13.754565954208374
46
+ gpt-3.5-turbo,english,call,3.124613248166584,602.9285714285714,97.85714285714286,,,,,,
47
+ gpt-3.5-turbo,english,json,2.4552148609626583,520.0853658536586,83.79268292682927,4.997304898054839,1.0,16.0,0.017422531230516167,0.0005590915679931641,0.4925534725189209
48
+ gpt-3.5-turbo,english,markdown,2.666209004142068,564.75,91.06818181818181,5.092008196721311,1.0,16.0,0.017853882908821107,0.0005643367767333984,1.127073049545288
49
+ gpt-3.5-turbo,japanese,call,8.609365148308836,372.23809523809524,4.392857142857143,,,,,,
50
+ gpt-3.5-turbo,japanese,json,5.703425769564472,236.84146341463415,3.341463414634146,1.1251375934186896,1.0,7.0,0.022491555757866794,0.0005545616149902344,13.75982117652893
51
+ gpt-3.5-turbo,japanese,markdown,7.63344073877102,357.4047619047619,6.880952380952381,1.2151704039504574,1.0,15.0,0.02293831178999754,0.0005612373352050781,13.71114993095398
52
+ gpt-4,english,call,10.829727350137173,441.225,69.05,,,,,,
53
+ gpt-4,english,json,9.5267409324646,470.65,74.625,4.912839248434238,1.0,16.0,0.08728140598796852,0.0005440711975097656,1.9534873962402344
54
+ gpt-4,english,markdown,10.24732003211975,427.8,67.45,5.041838538597525,1.0,15.0,0.10614711590633719,0.0005447864532470703,2.087376117706299
55
+ gpt-4,japanese,call,26.076972967539078,223.9,1.15,,,,,,
56
+ gpt-4,japanese,json,23.192965501394028,208.9,4.05,1.1566998892580287,1.0,7.0,0.11818944638881705,0.0005507469177246094,2.4770302772521973
57
+ gpt-4,japanese,markdown,36.14162145853042,282.65,3.15,1.1283433133732534,1.0,9.0,0.13859879746884404,0.0005800724029541016,2.9794347286224365
58
+ gpt-4-turbo,english,call,8.286203730106354,462.8,72.1,,,,,,
59
+ gpt-4-turbo,english,json,7.81642444729805,544.875,84.45,4.914317925591883,1.0,17.0,0.06131222159376005,0.0007143020629882812,0.7760622501373291
60
+ gpt-4-turbo,english,markdown,8.539259791374207,472.6,73.15,5.014323607427055,1.0,15.0,0.0789825123248113,0.0007131099700927734,2.0926766395568848
61
+ gpt-4-turbo,japanese,call,47.0068474650383,402.2,24.35,,,,,,
62
+ gpt-4-turbo,japanese,json,20.065124291181565,270.525,6.075,1.1806873977086743,1.0,8.0,0.08205758946486919,0.0006937980651855469,13.252992153167725
63
+ gpt-4-turbo,japanese,markdown,22.259230959415437,277.35,3.95,1.1460743801652893,1.0,8.0,0.0860337075123117,0.0007085800170898438,2.3845231533050537
64
+ llama-2-70b-chat,english,call,,,,,,,,,
65
+ llama-2-70b-chat,english,json,3.174426339921497,405.09375,62.359375,4.130975143403441,1.0,15.0,0.016708370984322405,0.00021314620971679688,0.5100884437561035
66
+ llama-2-70b-chat,english,markdown,4.972272306680679,951.7857142857143,147.47619047619048,4.128369307032944,1.0,16.0,0.01363343600582685,0.0002124309539794922,0.5661592483520508
67
+ llama-2-70b-chat,japanese,call,,,,,,,,,
68
+ llama-2-70b-chat,japanese,json,4.583555459976196,356.2741935483871,42.41935483870968,2.4138345536006995,1.0,15.0,0.017530749553071386,0.00020837783813476562,0.35228896141052246
69
+ llama-2-70b-chat,japanese,markdown,11.858248114585876,1293.3333333333333,154.38095238095238,2.3937951701040014,1.0,16.0,0.017392761688814075,0.0002117156982421875,76.44498753547668
70
+ zephyr-7b-beta,english,call,,,,,,,,,
71
+ zephyr-7b-beta,english,json,2.845248854160309,238.1,39.2,4.274685816876122,1.0,14.0,0.03622233246986485,0.0003070831298828125,0.4896988868713379
72
+ zephyr-7b-beta,english,markdown,5.826004445552826,318.825,51.825,4.382474226804124,1.0,15.0,0.06875277114488006,0.00040459632873535156,75.15552616119385
73
+ zephyr-7b-beta,japanese,call,,,,,,,,,
74
+ zephyr-7b-beta,japanese,json,2.1363336205482484,35.666666666666664,3.466666666666667,1.1674849972722312,1.0,7.0,0.042095991411432825,0.018090486526489258,0.4599947929382324
75
+ zephyr-7b-beta,japanese,markdown,2.2039071798324583,35.225,2.225,1.0345080763582966,1.0,4.0,0.041054743327058184,0.02583909034729004,0.4606599807739258
data/2024-02-01 08:08:06.822774_time_of_day_comparison.csv ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,time_of_day,execution_time,characters_count,words_count
2
+ Mistral-7B-Instruct-v0.2,afternoon,3.023258109887441,172.18333333333334,22.95
3
+ Mistral-7B-Instruct-v0.2,evening,3.2679351409276327,216.63333333333333,31.5
4
+ Mistral-7B-Instruct-v0.2,morning,3.174540030956268,113.0,16.27
5
+ Mixtral-8x7B-Instruct-v0.1,afternoon,7.426922065019608,450.4875,51.85
6
+ Mixtral-8x7B-Instruct-v0.1,evening,4.979682341865871,457.8,53.708333333333336
7
+ Mixtral-8x7B-Instruct-v0.1,morning,7.142197625471814,494.9583333333333,57.74166666666667
8
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,afternoon,1.538642168045044,169.46666666666667,26.083333333333332
9
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,evening,1.7001954774061838,222.51666666666668,35.575
10
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,morning,1.2902645373344421,106.18,16.74
11
+ chat-bison,morning,3.890243631601334,398.075,49.0
12
+ chat-bison (PaLM 2),afternoon,3.866238150000572,381.7875,40.3875
13
+ chat-bison (PaLM 2),evening,2.8466253956158956,358.525,39.25833333333333
14
+ chat-bison-32k,morning,4.128177767992019,389.925,48.025
15
+ chat-bison-32k (PaLM 2 32K),afternoon,4.844334444403648,371.25,38.7375
16
+ chat-bison-32k (PaLM 2 32K),evening,3.981116022666295,348.93333333333334,36.525
17
+ gemini-pro,afternoon,3.6972034962972007,352.2,33.9375
18
+ gemini-pro,evening,3.810917937329837,335.68333333333334,36.21666666666667
19
+ gemini-pro,morning,4.72138064004937,425.09166666666664,49.891666666666666
20
+ gpt-3.5-turbo,afternoon,4.228875203738137,364.92857142857144,36.42857142857143
21
+ gpt-3.5-turbo,evening,3.9572247514184915,375.75,37.660377358490564
22
+ gpt-3.5-turbo,morning,5.336839800789242,479.2785714285714,53.92142857142857
23
+ gpt-4,afternoon,20.52127287968868,307.175,31.975
24
+ gpt-4,evening,16.028902428833085,306.075,31.925
25
+ gpt-4,morning,15.5218456586202,389.1875,44.125
26
+ gpt-4-turbo,afternoon,23.51892908215523,396.40833333333336,41.858333333333334
27
+ gpt-4-turbo,evening,15.113789739608764,455.105,39.97
28
+ gpt-4-turbo,morning,14.008529031276703,433.075,49.975
29
+ llama-2-70b-chat,afternoon,4.851686128755895,671.2317073170732,83.5609756097561
30
+ llama-2-70b-chat,evening,4.701648034746685,582.578125,73.9921875
31
+ llama-2-70b-chat,morning,6.175082007679371,662.7416666666667,94.30833333333334
32
+ zephyr-7b-beta,afternoon,3.0400254487991334,163.45,23.8
33
+ zephyr-7b-beta,evening,3.3303639868895214,218.425,33.65
34
+ zephyr-7b-beta,morning,3.2387993240356447,112.57,17.26
data/2024-02-02 10:02:32.863904_time_of_day_comparison.csv ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,time_of_day,execution_time,characters_count,words_count
2
+ Mistral-7B-Instruct-v0.2,afternoon,3.2297915895779927,224.50833333333333,32.375
3
+ Mistral-7B-Instruct-v0.2,evening,3.335640662057059,237.52857142857144,35.33571428571429
4
+ Mistral-7B-Instruct-v0.2,midnight,,,
5
+ Mistral-7B-Instruct-v0.2,morning,3.267787692944209,154.65,23.283333333333335
6
+ Mistral-7B-Instruct-v0.2,noon,3.1783012986183166,210.325,30.975
7
+ Mixtral-8x7B-Instruct-v0.1,afternoon,6.686205209493637,451.71,60.95
8
+ Mixtral-8x7B-Instruct-v0.1,evening,4.822802252936781,414.6791666666667,55.68333333333333
9
+ Mixtral-8x7B-Instruct-v0.1,midnight,5.600324046611786,399.5,61.7
10
+ Mixtral-8x7B-Instruct-v0.1,morning,4.805075550901479,350.13125,47.046875
11
+ Mixtral-8x7B-Instruct-v0.1,noon,6.976712214946747,492.05,66.15
12
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,afternoon,1.6058823029200235,213.325,33.90833333333333
13
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,evening,1.722607149396624,243.87857142857143,39.43571428571428
14
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,midnight,2.0674875736236573,372.05,62.6
15
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,morning,1.6125914414723714,224.34444444444443,37.12222222222222
16
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,noon,1.6206423223018647,227.325,36.3
17
+ chat-bison,morning,3.890243631601334,398.075,49.0
18
+ chat-bison (PaLM 2),afternoon,3.2259692871570587,389.43,51.34
19
+ chat-bison (PaLM 2),evening,2.756077417731285,370.17083333333335,50.0625
20
+ chat-bison (PaLM 2),midnight,2.501569759845734,381.95,60.9
21
+ chat-bison (PaLM 2),morning,2.4648332941532134,381.865,60.92
22
+ chat-bison (PaLM 2),noon,2.706343245506287,307.6,35.7
23
+ chat-bison-32k,morning,4.128177767992019,389.925,48.025
24
+ chat-bison-32k (PaLM 2 32K),afternoon,4.288204146623611,362.5,46.555
25
+ chat-bison-32k (PaLM 2 32K),evening,8.945300988356273,342.34166666666664,45.1875
26
+ chat-bison-32k (PaLM 2 32K),midnight,7.170754861831665,335.75,53.85
27
+ chat-bison-32k (PaLM 2 32K),morning,5.129021260738373,335.75,53.85
28
+ chat-bison-32k (PaLM 2 32K),noon,4.41904046535492,304.3,32.1
29
+ gemini-pro,afternoon,3.268519560079924,360.825,45.92
30
+ gemini-pro,evening,3.265133913461264,355.7375,48.05416666666667
31
+ gemini-pro,midnight,2.8754740890703703,364.45,57.0
32
+ gemini-pro,morning,3.592642272646363,396.7375,56.6
33
+ gemini-pro,noon,3.1745591791052568,309.125,33.675
34
+ gpt-3.5-turbo,afternoon,4.410703988353233,390.6659192825112,42.2914798206278
35
+ gpt-3.5-turbo,evening,4.809755622192356,392.99825174825173,43.07867132867133
36
+ gpt-3.5-turbo,midnight,3.440265198548635,380.8333333333333,43.05
37
+ gpt-3.5-turbo,morning,4.75027750830197,426.46590909090907,50.22386363636364
38
+ gpt-3.5-turbo,noon,4.429612889289856,323.81,27.68
39
+ gpt-4,afternoon,18.126467501112433,315.16136363636366,36.856818181818184
40
+ gpt-4,evening,15.545672736714817,313.95,37.3
41
+ gpt-4,midnight,12.410712122917175,330.6166666666667,41.416666666666664
42
+ gpt-4,morning,14.07501753171285,335.77647058823527,42.84117647058824
43
+ gpt-4,noon,19.315037021636964,273.52,25.12
44
+ gpt-4-turbo,afternoon,22.23356882767244,366.7227272727273,45.41590909090909
45
+ gpt-4-turbo,evening,16.361396548577716,400.25892857142856,45.276785714285715
46
+ gpt-4-turbo,midnight,9.732182610034943,387.1,51.4
47
+ gpt-4-turbo,morning,13.437257664694506,361.0573529411765,47.733823529411765
48
+ gpt-4-turbo,noon,16.244312160015106,346.79,37.4
49
+ llama-2-70b-chat,afternoon,4.869195998604618,553.0742574257425,75.0990099009901
50
+ llama-2-70b-chat,evening,3.9572451173042764,470.4717741935484,64.35887096774194
51
+ llama-2-70b-chat,midnight,2.7049551407496133,312.85,48.55
52
+ llama-2-70b-chat,morning,4.015529702738376,456.196875,67.375
53
+ llama-2-70b-chat,noon,5.845867207175807,337.275,44.625
54
+ zephyr-7b-beta,afternoon,3.5596186633871385,273.65833333333336,43.233333333333334
55
+ zephyr-7b-beta,evening,3.4374013015202114,242.40714285714284,37.892857142857146
56
+ zephyr-7b-beta,midnight,,,
57
+ zephyr-7b-beta,morning,3.3750870446364085,158.19166666666666,24.941666666666666
58
+ zephyr-7b-beta,noon,3.3402509868144987,216.9,33.575
data/2024-02-02 10:13:06.642849_general_plot.csv ADDED
@@ -0,0 +1,428 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ path,plot_object,description,comment,plot_json
2
+ ./html/plots/response_times.html,"Figure({
3
+ 'data': [{'alignmentgroup': 'True',
4
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
5
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
6
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
7
+ 'name': 'Mistral-7B-Instruct-v0.2',
8
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
9
+ 'orientation': 'v',
10
+ 'showlegend': True,
11
+ 'textposition': 'auto',
12
+ 'type': 'bar',
13
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
+ 'xaxis': 'x',
15
+ 'y': array([3.27102681]),
16
+ 'yaxis': 'y'},
17
+ {'alignmentgroup': 'True',
18
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
19
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
20
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
21
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
22
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
23
+ 'orientation': 'v',
24
+ 'showlegend': True,
25
+ 'textposition': 'auto',
26
+ 'type': 'bar',
27
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
+ 'xaxis': 'x',
29
+ 'y': array([5.47596174]),
30
+ 'yaxis': 'y'},
31
+ {'alignmentgroup': 'True',
32
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
33
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
34
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
35
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
36
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
37
+ 'orientation': 'v',
38
+ 'showlegend': True,
39
+ 'textposition': 'auto',
40
+ 'type': 'bar',
41
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
+ 'xaxis': 'x',
43
+ 'y': array([1.66062556]),
44
+ 'yaxis': 'y'},
45
+ {'alignmentgroup': 'True',
46
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
47
+ 'legendgroup': 'chat-bison',
48
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
+ 'name': 'chat-bison',
50
+ 'offsetgroup': 'chat-bison',
51
+ 'orientation': 'v',
52
+ 'showlegend': True,
53
+ 'textposition': 'auto',
54
+ 'type': 'bar',
55
+ 'x': array(['chat-bison'], dtype=object),
56
+ 'xaxis': 'x',
57
+ 'y': array([3.89024363]),
58
+ 'yaxis': 'y'},
59
+ {'alignmentgroup': 'True',
60
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
61
+ 'legendgroup': 'chat-bison (PaLM 2)',
62
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
+ 'name': 'chat-bison (PaLM 2)',
64
+ 'offsetgroup': 'chat-bison (PaLM 2)',
65
+ 'orientation': 'v',
66
+ 'showlegend': True,
67
+ 'textposition': 'auto',
68
+ 'type': 'bar',
69
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
70
+ 'xaxis': 'x',
71
+ 'y': array([2.79700603]),
72
+ 'yaxis': 'y'},
73
+ {'alignmentgroup': 'True',
74
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
75
+ 'legendgroup': 'chat-bison-32k',
76
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
+ 'name': 'chat-bison-32k',
78
+ 'offsetgroup': 'chat-bison-32k',
79
+ 'orientation': 'v',
80
+ 'showlegend': True,
81
+ 'textposition': 'auto',
82
+ 'type': 'bar',
83
+ 'x': array(['chat-bison-32k'], dtype=object),
84
+ 'xaxis': 'x',
85
+ 'y': array([4.12817777]),
86
+ 'yaxis': 'y'},
87
+ {'alignmentgroup': 'True',
88
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
89
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
90
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
92
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
93
+ 'orientation': 'v',
94
+ 'showlegend': True,
95
+ 'textposition': 'auto',
96
+ 'type': 'bar',
97
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
98
+ 'xaxis': 'x',
99
+ 'y': array([6.21499148]),
100
+ 'yaxis': 'y'},
101
+ {'alignmentgroup': 'True',
102
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
103
+ 'legendgroup': 'gemini-pro',
104
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
105
+ 'name': 'gemini-pro',
106
+ 'offsetgroup': 'gemini-pro',
107
+ 'orientation': 'v',
108
+ 'showlegend': True,
109
+ 'textposition': 'auto',
110
+ 'type': 'bar',
111
+ 'x': array(['gemini-pro'], dtype=object),
112
+ 'xaxis': 'x',
113
+ 'y': array([3.37706134]),
114
+ 'yaxis': 'y'},
115
+ {'alignmentgroup': 'True',
116
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
117
+ 'legendgroup': 'gpt-3.5-turbo',
118
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
119
+ 'name': 'gpt-3.5-turbo',
120
+ 'offsetgroup': 'gpt-3.5-turbo',
121
+ 'orientation': 'v',
122
+ 'showlegend': True,
123
+ 'textposition': 'auto',
124
+ 'type': 'bar',
125
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
126
+ 'xaxis': 'x',
127
+ 'y': array([4.63898239]),
128
+ 'yaxis': 'y'},
129
+ {'alignmentgroup': 'True',
130
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
131
+ 'legendgroup': 'gpt-4',
132
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
133
+ 'name': 'gpt-4',
134
+ 'offsetgroup': 'gpt-4',
135
+ 'orientation': 'v',
136
+ 'showlegend': True,
137
+ 'textposition': 'auto',
138
+ 'type': 'bar',
139
+ 'x': array(['gpt-4'], dtype=object),
140
+ 'xaxis': 'x',
141
+ 'y': array([15.72262285]),
142
+ 'yaxis': 'y'},
143
+ {'alignmentgroup': 'True',
144
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
145
+ 'legendgroup': 'gpt-4-turbo',
146
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
147
+ 'name': 'gpt-4-turbo',
148
+ 'offsetgroup': 'gpt-4-turbo',
149
+ 'orientation': 'v',
150
+ 'showlegend': True,
151
+ 'textposition': 'auto',
152
+ 'type': 'bar',
153
+ 'x': array(['gpt-4-turbo'], dtype=object),
154
+ 'xaxis': 'x',
155
+ 'y': array([16.46241833]),
156
+ 'yaxis': 'y'},
157
+ {'alignmentgroup': 'True',
158
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
159
+ 'legendgroup': 'llama-2-70b-chat',
160
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
161
+ 'name': 'llama-2-70b-chat',
162
+ 'offsetgroup': 'llama-2-70b-chat',
163
+ 'orientation': 'v',
164
+ 'showlegend': True,
165
+ 'textposition': 'auto',
166
+ 'type': 'bar',
167
+ 'x': array(['llama-2-70b-chat'], dtype=object),
168
+ 'xaxis': 'x',
169
+ 'y': array([4.2692996]),
170
+ 'yaxis': 'y'},
171
+ {'alignmentgroup': 'True',
172
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
173
+ 'legendgroup': 'zephyr-7b-beta',
174
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
175
+ 'name': 'zephyr-7b-beta',
176
+ 'offsetgroup': 'zephyr-7b-beta',
177
+ 'orientation': 'v',
178
+ 'showlegend': True,
179
+ 'textposition': 'auto',
180
+ 'type': 'bar',
181
+ 'x': array(['zephyr-7b-beta'], dtype=object),
182
+ 'xaxis': 'x',
183
+ 'y': array([3.44499114]),
184
+ 'yaxis': 'y'}],
185
+ 'layout': {'barmode': 'relative',
186
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
187
+ 'template': '...',
188
+ 'title': {'text': 'Model endpoints response times'},
189
+ 'xaxis': {'anchor': 'y',
190
+ 'categoryarray': [Mistral-7B-Instruct-v0.2,
191
+ Mixtral-8x7B-Instruct-v0.1,
192
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
193
+ chat-bison, chat-bison (PaLM 2), chat-
194
+ bison-32k, chat-bison-32k (PaLM 2 32K),
195
+ gemini-pro, gpt-3.5-turbo, gpt-4,
196
+ gpt-4-turbo, llama-2-70b-chat,
197
+ zephyr-7b-beta],
198
+ 'categoryorder': 'array',
199
+ 'domain': [0.0, 1.0],
200
+ 'title': {'text': 'Model'}},
201
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution time (s)'}}}
202
+ })",Model endpoints response times,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[3.271026806036631],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[5.475961740149392],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.6606255621910095],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[3.890243631601334],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[2.7970060307638986],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[4.128177767992019],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 32K)""],""xaxis"":""x"",""y"":[6.214991477898189],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[3.3770613408857777],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[4.63898239252044],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[15.72262285346881],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[16.462418334769165],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[4.269299596734112],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[3.4449911407752936],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222
,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""e
rror_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E
880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""line
color"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison"",""chat-bison (PaLM 2)"",""chat-bison-32k"",""chat-bison-32k (PaLM 2 32K)"",""gemini-pro"",""gpt-3.5-turbo"",""gpt-4"",""gpt-4-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution time (s)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model endpoints response times""},""barmode"":""relative""}}"
203
+ ./html/plots/execution_costs.html,"Figure({
204
+ 'data': [{'alignmentgroup': 'True',
205
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
206
+ 'legendgroup': 'gpt-3.5-turbo',
207
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
208
+ 'name': 'gpt-3.5-turbo',
209
+ 'offsetgroup': 'gpt-3.5-turbo',
210
+ 'orientation': 'v',
211
+ 'showlegend': True,
212
+ 'textposition': 'auto',
213
+ 'type': 'bar',
214
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
215
+ 'xaxis': 'x',
216
+ 'y': array([0.23604]),
217
+ 'yaxis': 'y'},
218
+ {'alignmentgroup': 'True',
219
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
220
+ 'legendgroup': 'gpt-4-turbo',
221
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
222
+ 'name': 'gpt-4-turbo',
223
+ 'offsetgroup': 'gpt-4-turbo',
224
+ 'orientation': 'v',
225
+ 'showlegend': True,
226
+ 'textposition': 'auto',
227
+ 'type': 'bar',
228
+ 'x': array(['gpt-4-turbo'], dtype=object),
229
+ 'xaxis': 'x',
230
+ 'y': array([2.5988]),
231
+ 'yaxis': 'y'},
232
+ {'alignmentgroup': 'True',
233
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
234
+ 'legendgroup': 'gpt-4',
235
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
236
+ 'name': 'gpt-4',
237
+ 'offsetgroup': 'gpt-4',
238
+ 'orientation': 'v',
239
+ 'showlegend': True,
240
+ 'textposition': 'auto',
241
+ 'type': 'bar',
242
+ 'x': array(['gpt-4'], dtype=object),
243
+ 'xaxis': 'x',
244
+ 'y': array([5.8344]),
245
+ 'yaxis': 'y'},
246
+ {'alignmentgroup': 'True',
247
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
248
+ 'legendgroup': 'llama-2-70b-chat',
249
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
250
+ 'name': 'llama-2-70b-chat',
251
+ 'offsetgroup': 'llama-2-70b-chat',
252
+ 'orientation': 'v',
253
+ 'showlegend': True,
254
+ 'textposition': 'auto',
255
+ 'type': 'bar',
256
+ 'x': array(['llama-2-70b-chat'], dtype=object),
257
+ 'xaxis': 'x',
258
+ 'y': array([0.040992]),
259
+ 'yaxis': 'y'},
260
+ {'alignmentgroup': 'True',
261
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
262
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
263
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
264
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
265
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
266
+ 'orientation': 'v',
267
+ 'showlegend': True,
268
+ 'textposition': 'auto',
269
+ 'type': 'bar',
270
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
271
+ 'xaxis': 'x',
272
+ 'y': array([0.143622]),
273
+ 'yaxis': 'y'},
274
+ {'alignmentgroup': 'True',
275
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
276
+ 'legendgroup': 'zephyr-7b-beta',
277
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
278
+ 'name': 'zephyr-7b-beta',
279
+ 'offsetgroup': 'zephyr-7b-beta',
280
+ 'orientation': 'v',
281
+ 'showlegend': True,
282
+ 'textposition': 'auto',
283
+ 'type': 'bar',
284
+ 'x': array(['zephyr-7b-beta'], dtype=object),
285
+ 'xaxis': 'x',
286
+ 'y': array([0.15650749]),
287
+ 'yaxis': 'y'},
288
+ {'alignmentgroup': 'True',
289
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
290
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
291
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
292
+ 'name': 'Mistral-7B-Instruct-v0.2',
293
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
294
+ 'orientation': 'v',
295
+ 'showlegend': True,
296
+ 'textposition': 'auto',
297
+ 'type': 'bar',
298
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
299
+ 'xaxis': 'x',
300
+ 'y': array([0.08633046]),
301
+ 'yaxis': 'y'},
302
+ {'alignmentgroup': 'True',
303
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
304
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
305
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
306
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
307
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
308
+ 'orientation': 'v',
309
+ 'showlegend': True,
310
+ 'textposition': 'auto',
311
+ 'type': 'bar',
312
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
313
+ 'xaxis': 'x',
314
+ 'y': array([0.02132704]),
315
+ 'yaxis': 'y'},
316
+ {'alignmentgroup': 'True',
317
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
318
+ 'legendgroup': 'gemini-pro',
319
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
320
+ 'name': 'gemini-pro',
321
+ 'offsetgroup': 'gemini-pro',
322
+ 'orientation': 'v',
323
+ 'showlegend': True,
324
+ 'textposition': 'auto',
325
+ 'type': 'bar',
326
+ 'x': array(['gemini-pro'], dtype=object),
327
+ 'xaxis': 'x',
328
+ 'y': array([0.05781]),
329
+ 'yaxis': 'y'},
330
+ {'alignmentgroup': 'True',
331
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
332
+ 'legendgroup': 'chat-bison (PaLM 2)',
333
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
334
+ 'name': 'chat-bison (PaLM 2)',
335
+ 'offsetgroup': 'chat-bison (PaLM 2)',
336
+ 'orientation': 'v',
337
+ 'showlegend': True,
338
+ 'textposition': 'auto',
339
+ 'type': 'bar',
340
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
341
+ 'xaxis': 'x',
342
+ 'y': array([0.05291]),
343
+ 'yaxis': 'y'},
344
+ {'alignmentgroup': 'True',
345
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
346
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
347
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
348
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
349
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
350
+ 'orientation': 'v',
351
+ 'showlegend': True,
352
+ 'textposition': 'auto',
353
+ 'type': 'bar',
354
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
355
+ 'xaxis': 'x',
356
+ 'y': array([0.04954]),
357
+ 'yaxis': 'y'}],
358
+ 'layout': {'barmode': 'relative',
359
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
360
+ 'template': '...',
361
+ 'title': {'text': 'Costs of execution of 800 test queries per model'},
362
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
363
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}}}
364
+ })",Costs of execution of 800 test queries per model,Note that pause and resume time cost was not included in the cost calculation for the models billed hourly. Also although Gemini-Pro model is free for under 60 queries per minute we calculated the full cost for generating the tokens.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[0.23604],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[2.5987999999999998],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[5.8344000000000005],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[0.040992],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[0.14362200000000003],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[0.15650748757521313],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[0.08633045819070603],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[0.02132703948020935],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[0.05781],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[0.05291],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 
32K)""],""xaxis"":""x"",""y"":[0.04954],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""ou
tlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter
mapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],
[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""
}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 800 test queries per model""},""barmode"":""relative""}}"
365
+ ./html/plots/model_sizes.html,"Figure({
366
+ 'data': [{'alignmentgroup': 'True',
367
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
368
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
369
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
370
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
371
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
372
+ 'orientation': 'v',
373
+ 'showlegend': True,
374
+ 'textposition': 'auto',
375
+ 'type': 'bar',
376
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
377
+ 'xaxis': 'x',
378
+ 'y': array([56.]),
379
+ 'yaxis': 'y'},
380
+ {'alignmentgroup': 'True',
381
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
382
+ 'legendgroup': 'zephyr-7b-beta',
383
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
384
+ 'name': 'zephyr-7b-beta',
385
+ 'offsetgroup': 'zephyr-7b-beta',
386
+ 'orientation': 'v',
387
+ 'showlegend': True,
388
+ 'textposition': 'auto',
389
+ 'type': 'bar',
390
+ 'x': array(['zephyr-7b-beta'], dtype=object),
391
+ 'xaxis': 'x',
392
+ 'y': array([7.]),
393
+ 'yaxis': 'y'},
394
+ {'alignmentgroup': 'True',
395
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
396
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
397
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
398
+ 'name': 'Mistral-7B-Instruct-v0.2',
399
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
400
+ 'orientation': 'v',
401
+ 'showlegend': True,
402
+ 'textposition': 'auto',
403
+ 'type': 'bar',
404
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
405
+ 'xaxis': 'x',
406
+ 'y': array([7.]),
407
+ 'yaxis': 'y'},
408
+ {'alignmentgroup': 'True',
409
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
410
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
411
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
412
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
413
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
414
+ 'orientation': 'v',
415
+ 'showlegend': True,
416
+ 'textposition': 'auto',
417
+ 'type': 'bar',
418
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
419
+ 'xaxis': 'x',
420
+ 'y': array([1.1]),
421
+ 'yaxis': 'y'}],
422
+ 'layout': {'barmode': 'relative',
423
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
424
+ 'template': '...',
425
+ 'title': {'text': 'Model sizes in billions of parameters'},
426
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
427
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}}}
428
+ })",Model sizes in billions of parameters,Note that some models have undisclosed sizes.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B 
params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.1],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.
2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}
}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary""
:{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true
,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"
data/2024-02-02 11:10:33.807657_general_plot.csv ADDED
@@ -0,0 +1,293 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ path,plot_object,description,comment,plot_json
2
+ ./html/plots/response_times.html,"Figure({
3
+ 'data': [{'alignmentgroup': 'True',
4
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
5
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
6
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
7
+ 'name': 'Mistral-7B-Instruct-v0.2',
8
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
9
+ 'orientation': 'v',
10
+ 'showlegend': True,
11
+ 'textposition': 'auto',
12
+ 'type': 'bar',
13
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
+ 'xaxis': 'x',
15
+ 'y': array([3.27102681]),
16
+ 'yaxis': 'y'},
17
+ {'alignmentgroup': 'True',
18
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
19
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
20
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
21
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
22
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
23
+ 'orientation': 'v',
24
+ 'showlegend': True,
25
+ 'textposition': 'auto',
26
+ 'type': 'bar',
27
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
+ 'xaxis': 'x',
29
+ 'y': array([5.47596174]),
30
+ 'yaxis': 'y'},
31
+ {'alignmentgroup': 'True',
32
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
33
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
34
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
35
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
36
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
37
+ 'orientation': 'v',
38
+ 'showlegend': True,
39
+ 'textposition': 'auto',
40
+ 'type': 'bar',
41
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
+ 'xaxis': 'x',
43
+ 'y': array([1.66062556]),
44
+ 'yaxis': 'y'},
45
+ {'alignmentgroup': 'True',
46
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
47
+ 'legendgroup': 'chat-bison',
48
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
+ 'name': 'chat-bison',
50
+ 'offsetgroup': 'chat-bison',
51
+ 'orientation': 'v',
52
+ 'showlegend': True,
53
+ 'textposition': 'auto',
54
+ 'type': 'bar',
55
+ 'x': array(['chat-bison'], dtype=object),
56
+ 'xaxis': 'x',
57
+ 'y': array([3.89024363]),
58
+ 'yaxis': 'y'},
59
+ {'alignmentgroup': 'True',
60
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
61
+ 'legendgroup': 'chat-bison (PaLM 2)',
62
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
+ 'name': 'chat-bison (PaLM 2)',
64
+ 'offsetgroup': 'chat-bison (PaLM 2)',
65
+ 'orientation': 'v',
66
+ 'showlegend': True,
67
+ 'textposition': 'auto',
68
+ 'type': 'bar',
69
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
70
+ 'xaxis': 'x',
71
+ 'y': array([2.79700603]),
72
+ 'yaxis': 'y'},
73
+ {'alignmentgroup': 'True',
74
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
75
+ 'legendgroup': 'chat-bison-32k',
76
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
+ 'name': 'chat-bison-32k',
78
+ 'offsetgroup': 'chat-bison-32k',
79
+ 'orientation': 'v',
80
+ 'showlegend': True,
81
+ 'textposition': 'auto',
82
+ 'type': 'bar',
83
+ 'x': array(['chat-bison-32k'], dtype=object),
84
+ 'xaxis': 'x',
85
+ 'y': array([4.12817777]),
86
+ 'yaxis': 'y'},
87
+ {'alignmentgroup': 'True',
88
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
89
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
90
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
92
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
93
+ 'orientation': 'v',
94
+ 'showlegend': True,
95
+ 'textposition': 'auto',
96
+ 'type': 'bar',
97
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
98
+ 'xaxis': 'x',
99
+ 'y': array([6.21499148]),
100
+ 'yaxis': 'y'},
101
+ {'alignmentgroup': 'True',
102
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
103
+ 'legendgroup': 'gemini-pro',
104
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
105
+ 'name': 'gemini-pro',
106
+ 'offsetgroup': 'gemini-pro',
107
+ 'orientation': 'v',
108
+ 'showlegend': True,
109
+ 'textposition': 'auto',
110
+ 'type': 'bar',
111
+ 'x': array(['gemini-pro'], dtype=object),
112
+ 'xaxis': 'x',
113
+ 'y': array([3.37706134]),
114
+ 'yaxis': 'y'},
115
+ {'alignmentgroup': 'True',
116
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
117
+ 'legendgroup': 'gpt-3.5-turbo',
118
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
119
+ 'name': 'gpt-3.5-turbo',
120
+ 'offsetgroup': 'gpt-3.5-turbo',
121
+ 'orientation': 'v',
122
+ 'showlegend': True,
123
+ 'textposition': 'auto',
124
+ 'type': 'bar',
125
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
126
+ 'xaxis': 'x',
127
+ 'y': array([4.63898239]),
128
+ 'yaxis': 'y'},
129
+ {'alignmentgroup': 'True',
130
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
131
+ 'legendgroup': 'gpt-4',
132
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
133
+ 'name': 'gpt-4',
134
+ 'offsetgroup': 'gpt-4',
135
+ 'orientation': 'v',
136
+ 'showlegend': True,
137
+ 'textposition': 'auto',
138
+ 'type': 'bar',
139
+ 'x': array(['gpt-4'], dtype=object),
140
+ 'xaxis': 'x',
141
+ 'y': array([15.72262285]),
142
+ 'yaxis': 'y'},
143
+ {'alignmentgroup': 'True',
144
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
145
+ 'legendgroup': 'gpt-4-turbo',
146
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
147
+ 'name': 'gpt-4-turbo',
148
+ 'offsetgroup': 'gpt-4-turbo',
149
+ 'orientation': 'v',
150
+ 'showlegend': True,
151
+ 'textposition': 'auto',
152
+ 'type': 'bar',
153
+ 'x': array(['gpt-4-turbo'], dtype=object),
154
+ 'xaxis': 'x',
155
+ 'y': array([16.46241833]),
156
+ 'yaxis': 'y'},
157
+ {'alignmentgroup': 'True',
158
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
159
+ 'legendgroup': 'llama-2-70b-chat',
160
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
161
+ 'name': 'llama-2-70b-chat',
162
+ 'offsetgroup': 'llama-2-70b-chat',
163
+ 'orientation': 'v',
164
+ 'showlegend': True,
165
+ 'textposition': 'auto',
166
+ 'type': 'bar',
167
+ 'x': array(['llama-2-70b-chat'], dtype=object),
168
+ 'xaxis': 'x',
169
+ 'y': array([4.2692996]),
170
+ 'yaxis': 'y'},
171
+ {'alignmentgroup': 'True',
172
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
173
+ 'legendgroup': 'zephyr-7b-beta',
174
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
175
+ 'name': 'zephyr-7b-beta',
176
+ 'offsetgroup': 'zephyr-7b-beta',
177
+ 'orientation': 'v',
178
+ 'showlegend': True,
179
+ 'textposition': 'auto',
180
+ 'type': 'bar',
181
+ 'x': array(['zephyr-7b-beta'], dtype=object),
182
+ 'xaxis': 'x',
183
+ 'y': array([3.44499114]),
184
+ 'yaxis': 'y'}],
185
+ 'layout': {'barmode': 'relative',
186
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
187
+ 'template': '...',
188
+ 'title': {'text': 'Model endpoints response times'},
189
+ 'xaxis': {'anchor': 'y',
190
+ 'categoryarray': [Mistral-7B-Instruct-v0.2,
191
+ Mixtral-8x7B-Instruct-v0.1,
192
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
193
+ chat-bison, chat-bison (PaLM 2), chat-
194
+ bison-32k, chat-bison-32k (PaLM 2 32K),
195
+ gemini-pro, gpt-3.5-turbo, gpt-4,
196
+ gpt-4-turbo, llama-2-70b-chat,
197
+ zephyr-7b-beta],
198
+ 'categoryorder': 'array',
199
+ 'domain': [0.0, 1.0],
200
+ 'title': {'text': 'Model'}},
201
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution time (s)'}}}
202
+ })",Model endpoints response times,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[3.271026806036631],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[5.475961740149392],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.6606255621910095],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[3.890243631601334],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[2.7970060307638986],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[4.128177767992019],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 32K)""],""xaxis"":""x"",""y"":[6.214991477898189],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[3.3770613408857777],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[4.63898239252044],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[15.72262285346881],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[16.462418334769165],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[4.269299596734112],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[3.4449911407752936],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222
,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""e
rror_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E
880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""line
color"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison"",""chat-bison (PaLM 2)"",""chat-bison-32k"",""chat-bison-32k (PaLM 2 32K)"",""gemini-pro"",""gpt-3.5-turbo"",""gpt-4"",""gpt-4-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution time (s)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model endpoints response times""},""barmode"":""relative""}}"
203
+ ./html/plots/execution_costs.html,"Figure({
204
+ 'data': [{'alignmentgroup': 'True',
205
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
206
+ 'legendgroup': '',
207
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
208
+ 'name': '',
209
+ 'offsetgroup': '',
210
+ 'orientation': 'v',
211
+ 'showlegend': False,
212
+ 'textposition': 'auto',
213
+ 'type': 'bar',
214
+ 'x': array(['gpt-3.5-turbo', 'gpt-4-turbo', 'gpt-4', 'llama-2-70b-chat',
215
+ 'Mixtral-8x7B-Instruct-v0.1', 'zephyr-7b-beta',
216
+ 'Mistral-7B-Instruct-v0.2', 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
217
+ 'gemini-pro', 'chat-bison (PaLM 2)', 'chat-bison-32k (PaLM 2 32K)'],
218
+ dtype=object),
219
+ 'xaxis': 'x',
220
+ 'y': array([0.22948 , 2.9468 , 6.342 , 0.02828 , 0.12708 , 0.04109804,
221
+ 0.10571385, 0.00933233, 0.05789 , 0.04731 , 0.04454 ]),
222
+ 'yaxis': 'y'}],
223
+ 'layout': {'barmode': 'relative',
224
+ 'legend': {'tracegroupgap': 0},
225
+ 'template': '...',
226
+ 'title': {'text': 'Costs of execution of 800 test queries per model'},
227
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
228
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}}}
229
+ })",Costs of execution of 800 test queries per model,Note that pause and resume time cost was not included in the cost calculation for the models billed hourly. Also although Gemini-Pro model is free for under 60 queries per minute we calculated the full cost for generating the tokens.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":"""",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":"""",""offsetgroup"":"""",""orientation"":""v"",""showlegend"":false,""textposition"":""auto"",""x"":[""gpt-3.5-turbo"",""gpt-4-turbo"",""gpt-4"",""llama-2-70b-chat"",""Mixtral-8x7B-Instruct-v0.1"",""zephyr-7b-beta"",""Mistral-7B-Instruct-v0.2"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""gemini-pro"",""chat-bison (PaLM 2)"",""chat-bison-32k (PaLM 2 32K)""],""xaxis"":""x"",""y"":[0.22948,2.9467999999999996,6.3420000000000005,0.02828,0.12708,0.0410980390045378,0.1057138456636005,0.009332333167394003,0.05789,0.04731,0.044539999999999996],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777
777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{
""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""siz
e"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"
":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""legend"":{""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 800 test queries per model""},""barmode"":""relative""}}"
230
+ ./html/plots/model_sizes.html,"Figure({
231
+ 'data': [{'alignmentgroup': 'True',
232
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
233
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
234
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
235
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
236
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
237
+ 'orientation': 'v',
238
+ 'showlegend': True,
239
+ 'textposition': 'auto',
240
+ 'type': 'bar',
241
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
242
+ 'xaxis': 'x',
243
+ 'y': array([56.]),
244
+ 'yaxis': 'y'},
245
+ {'alignmentgroup': 'True',
246
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
247
+ 'legendgroup': 'zephyr-7b-beta',
248
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
249
+ 'name': 'zephyr-7b-beta',
250
+ 'offsetgroup': 'zephyr-7b-beta',
251
+ 'orientation': 'v',
252
+ 'showlegend': True,
253
+ 'textposition': 'auto',
254
+ 'type': 'bar',
255
+ 'x': array(['zephyr-7b-beta'], dtype=object),
256
+ 'xaxis': 'x',
257
+ 'y': array([7.]),
258
+ 'yaxis': 'y'},
259
+ {'alignmentgroup': 'True',
260
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
261
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
262
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
263
+ 'name': 'Mistral-7B-Instruct-v0.2',
264
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
265
+ 'orientation': 'v',
266
+ 'showlegend': True,
267
+ 'textposition': 'auto',
268
+ 'type': 'bar',
269
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
270
+ 'xaxis': 'x',
271
+ 'y': array([7.]),
272
+ 'yaxis': 'y'},
273
+ {'alignmentgroup': 'True',
274
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
275
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
276
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
277
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
278
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
279
+ 'orientation': 'v',
280
+ 'showlegend': True,
281
+ 'textposition': 'auto',
282
+ 'type': 'bar',
283
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
284
+ 'xaxis': 'x',
285
+ 'y': array([1.1]),
286
+ 'yaxis': 'y'}],
287
+ 'layout': {'barmode': 'relative',
288
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
289
+ 'template': '...',
290
+ 'title': {'text': 'Model sizes in billions of parameters'},
291
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
292
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}}}
293
+ })",Model sizes in billions of parameters,Note that some models have undisclosed sizes.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B 
params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.1],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.
2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}
}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary""
:{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true
,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"
data/2024-02-03 21:01:06.672013_time_of_day_comparison.csv ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,time_of_day,execution_time,characters_count,words_count
2
+ Mistral-7B-Instruct-v0.2,afternoon,3.2297915895779927,224.50833333333333,32.375
3
+ Mistral-7B-Instruct-v0.2,evening,3.335640662057059,237.52857142857144,35.33571428571429
4
+ Mistral-7B-Instruct-v0.2,midnight,,,
5
+ Mistral-7B-Instruct-v0.2,morning,3.267787692944209,154.65,23.283333333333335
6
+ Mistral-7B-Instruct-v0.2,noon,3.1783012986183166,210.325,30.975
7
+ Mixtral-8x7B-Instruct-v0.1,afternoon,5.647441667449138,361.92105263157896,51.305263157894736
8
+ Mixtral-8x7B-Instruct-v0.1,evening,4.120577350668951,346.51,48.5125
9
+ Mixtral-8x7B-Instruct-v0.1,midnight,5.600324046611786,399.5,61.7
10
+ Mixtral-8x7B-Instruct-v0.1,morning,4.245225775510745,318.15714285714284,45.17857142857143
11
+ Mixtral-8x7B-Instruct-v0.1,noon,5.2255242466926575,350.46,50.36
12
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,afternoon,1.7891986429691316,292.65833333333336,48.225
13
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,evening,1.8029413998126984,282.245,46.325
14
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,midnight,2.0674875736236573,372.05,62.6
15
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,morning,1.7550641377766927,283.4533333333333,47.29
16
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,noon,1.8389003086090088,314.46,52.08
17
+ chat-bison,morning,3.890243631601334,398.075,49.0
18
+ chat-bison (PaLM 2),afternoon,2.8929106787631387,385.43684210526317,55.810526315789474
19
+ chat-bison (PaLM 2),evening,2.7066626918315886,374.8975,54.42
20
+ chat-bison (PaLM 2),midnight,2.501569759845734,381.95,60.9
21
+ chat-bison (PaLM 2),morning,2.4689753359014337,381.8840909090909,60.902272727272724
22
+ chat-bison (PaLM 2),noon,2.571754927635193,352.17,50.81
23
+ chat-bison-32k,morning,4.128177767992019,389.925,48.025
24
+ chat-bison-32k (PaLM 2 32K),afternoon,4.44931383258418,349.0105263157895,49.86052631578947
25
+ chat-bison-32k (PaLM 2 32K),evening,7.76503027677536,339.705,48.6525
26
+ chat-bison-32k (PaLM 2 32K),midnight,7.170754861831665,335.75,53.85
27
+ chat-bison-32k (PaLM 2 32K),morning,7.92237914909016,335.75,53.85
28
+ chat-bison-32k (PaLM 2 32K),noon,6.040619640350342,323.17,45.15
29
+ gemini-pro,afternoon,2.8898058522299785,366.08684210526314,52.444736842105264
30
+ gemini-pro,evening,3.060831026541881,364.98,52.845
31
+ gemini-pro,midnight,2.8754740890703703,364.45,57.0
32
+ gemini-pro,morning,3.172877737902161,386.9125,58.09464285714286
33
+ gemini-pro,noon,2.7814492097834953,348.55,49.4
34
+ gpt-3.5-turbo,afternoon,4.1847387138678105,398.0991253644315,45.470845481049565
35
+ gpt-3.5-turbo,evening,4.304991676779234,399.01502145922746,44.74034334763949
36
+ gpt-3.5-turbo,midnight,3.5683146858215333,404.84,43.88
37
+ gpt-3.5-turbo,morning,4.437713119534958,423.19741379310346,49.02155172413793
38
+ gpt-3.5-turbo,noon,4.098882734775543,346.4125,34.7375
39
+ gpt-4,afternoon,16.17388726863186,320.5529411764706,39.75588235294118
40
+ gpt-4,evening,14.089318896690486,316.045652173913,38.46413043478261
41
+ gpt-4,midnight,12.091028991371694,316.73,37.44
42
+ gpt-4,morning,12.958622653407113,330.034375,41.71145833333333
43
+ gpt-4,noon,17.375231413543226,295.78125,31.23125
44
+ gpt-4-turbo,afternoon,18.663996428251266,364.4514705882353,47.06470588235294
45
+ gpt-4-turbo,evening,15.48614443048187,399.3239130434783,46.46630434782609
46
+ gpt-4-turbo,midnight,11.938190605640411,384.78,44.55
47
+ gpt-4-turbo,morning,13.66163076336185,369.496875,48.915625
48
+ gpt-4-turbo,noon,16.01451396048069,374.3375,45.11875
49
+ llama-2-70b-chat,afternoon,3.9614109361273613,429.84293193717275,60.924083769633505
50
+ llama-2-70b-chat,evening,3.514792161901998,407.02941176470586,57.77205882352941
51
+ llama-2-70b-chat,midnight,2.7049551407496133,312.85,48.55
52
+ llama-2-70b-chat,morning,3.5679600898884543,378.98214285714283,56.725
53
+ llama-2-70b-chat,noon,4.026921252409617,294.06,42.54
54
+ zephyr-7b-beta,afternoon,3.5596186633871385,273.65833333333336,43.233333333333334
55
+ zephyr-7b-beta,evening,3.4374013015202114,242.40714285714284,37.892857142857146
56
+ zephyr-7b-beta,midnight,,,
57
+ zephyr-7b-beta,morning,3.3750870446364085,158.19166666666666,24.941666666666666
58
+ zephyr-7b-beta,noon,3.3402509868144987,216.9,33.575
data/2024-02-03 22:21:49.754184_time_of_day_comparison.csv ADDED
@@ -0,0 +1,267 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,hour,execution_time,characters_count,words_count
2
+ Mistral-7B-Instruct-v0.2,0.0,,,
3
+ Mistral-7B-Instruct-v0.2,1.0,1.9149879813194275,37.8,2.95
4
+ Mistral-7B-Instruct-v0.2,2.0,,,
5
+ Mistral-7B-Instruct-v0.2,3.0,,,
6
+ Mistral-7B-Instruct-v0.2,4.0,,,
7
+ Mistral-7B-Instruct-v0.2,5.0,,,
8
+ Mistral-7B-Instruct-v0.2,6.0,,,
9
+ Mistral-7B-Instruct-v0.2,7.0,,,
10
+ Mistral-7B-Instruct-v0.2,8.0,,,
11
+ Mistral-7B-Instruct-v0.2,9.0,,,
12
+ Mistral-7B-Instruct-v0.2,10.0,,,
13
+ Mistral-7B-Instruct-v0.2,11.0,3.734026002883911,362.9,58.35
14
+ Mistral-7B-Instruct-v0.2,12.0,3.1783012986183166,210.325,30.975
15
+ Mistral-7B-Instruct-v0.2,13.0,,,
16
+ Mistral-7B-Instruct-v0.2,14.0,3.2796461462974547,233.8,33.525
17
+ Mistral-7B-Instruct-v0.2,15.0,3.749682915210724,362.9,58.35
18
+ Mistral-7B-Instruct-v0.2,16.0,3.023258109887441,172.18333333333334,22.95
19
+ Mistral-7B-Instruct-v0.2,17.0,,,
20
+ Mistral-7B-Instruct-v0.2,18.0,3.741873788833618,362.9,58.35
21
+ Mistral-7B-Instruct-v0.2,19.0,,,
22
+ Mistral-7B-Instruct-v0.2,20.0,3.225523215532303,210.325,30.975
23
+ Mistral-7B-Instruct-v0.2,21.0,3.2891411036252975,219.7875,31.7625
24
+ Mistral-7B-Instruct-v0.2,22.0,,,
25
+ Mistral-7B-Instruct-v0.2,23.0,,,
26
+ Mixtral-8x7B-Instruct-v0.1,0.0,5.600324046611786,399.5,61.7
27
+ Mixtral-8x7B-Instruct-v0.1,1.0,3.643988568608354,389.36,55.27
28
+ Mixtral-8x7B-Instruct-v0.1,2.0,3.1196579193246774,275.875,42.4
29
+ Mixtral-8x7B-Instruct-v0.1,3.0,3.017132020765735,316.8,49.025
30
+ Mixtral-8x7B-Instruct-v0.1,4.0,3.0949330102829706,200.375,30.9
31
+ Mixtral-8x7B-Instruct-v0.1,5.0,2.8691824844905307,279.65,42.95
32
+ Mixtral-8x7B-Instruct-v0.1,6.0,2.9245848854382834,251.4,38.7
33
+ Mixtral-8x7B-Instruct-v0.1,7.0,3.039147071838379,244.925,37.8
34
+ Mixtral-8x7B-Instruct-v0.1,8.0,3.6833377838134767,236.73333333333332,36.68333333333333
35
+ Mixtral-8x7B-Instruct-v0.1,9.0,2.35319835799081,286.25,44.75
36
+ Mixtral-8x7B-Instruct-v0.1,10.0,4.525930786132813,311.3,48.55
37
+ Mixtral-8x7B-Instruct-v0.1,11.0,4.267878273700146,308.85,47.7
38
+ Mixtral-8x7B-Instruct-v0.1,12.0,5.2255242466926575,350.46,50.36
39
+ Mixtral-8x7B-Instruct-v0.1,13.0,4.550832962644273,371.5375,57.975
40
+ Mixtral-8x7B-Instruct-v0.1,14.0,6.3550496492812885,390.675,55.725
41
+ Mixtral-8x7B-Instruct-v0.1,15.0,5.536225740114848,298.05,46.2
42
+ Mixtral-8x7B-Instruct-v0.1,16.0,6.244929383286332,410.9916666666667,51.69166666666667
43
+ Mixtral-8x7B-Instruct-v0.1,17.0,4.749357461929321,255.2,39.15
44
+ Mixtral-8x7B-Instruct-v0.1,18.0,3.441127454080889,312.875,48.525
45
+ Mixtral-8x7B-Instruct-v0.1,19.0,3.921023598888464,279.5625,43.225
46
+ Mixtral-8x7B-Instruct-v0.1,20.0,3.5051895811937857,380.725,53.875
47
+ Mixtral-8x7B-Instruct-v0.1,21.0,4.853644103915603,408.34166666666664,49.56666666666667
48
+ Mixtral-8x7B-Instruct-v0.1,22.0,3.1714347918828327,284.9,43.825
49
+ Mixtral-8x7B-Instruct-v0.1,23.0,4.876900292932987,321.725,49.875
50
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.0,2.0674875736236573,372.05,62.6
51
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,1.0,1.2007620811462403,48.35,5.8
52
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,2.0,,,
53
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,3.0,2.0712238788604735,372.05,62.6
54
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,4.0,1.9543781518936156,372.05,62.6
55
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,5.0,,,
56
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,6.0,2.110265576839447,372.05,62.6
57
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,7.0,2.0211721837520598,372.25,62.425
58
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,8.0,1.99203217625618,372.05,62.6
59
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,9.0,,,
60
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,10.0,,,
61
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,11.0,1.9041210174560548,372.05,62.6
62
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,12.0,1.8389003086090088,314.46,52.08
63
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,13.0,1.9219599564870198,353.6666666666667,59.266666666666666
64
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,14.0,1.7107620418071747,227.325,36.3
65
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,15.0,1.8755218625068664,372.05,62.6
66
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,16.0,1.538642168045044,169.46666666666667,26.083333333333332
67
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,17.0,1.9580047667026519,371.875,62.425
68
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,18.0,1.857077181339264,372.05,62.6
69
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,19.0,1.938528937101364,371.625,62.3
70
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,20.0,1.628979456424713,227.325,36.3
71
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,21.0,1.7358034878969193,220.1125,35.2125
72
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,22.0,,,
73
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,23.0,2.094106078147888,372.05,62.6
74
+ chat-bison,1.0,3.890243631601334,398.075,49.0
75
+ chat-bison (PaLM 2),0.0,2.501569759845734,381.95,60.9
76
+ chat-bison (PaLM 2),1.0,2.476984361807505,381.95,60.9
77
+ chat-bison (PaLM 2),2.0,2.438890391588211,381.95,60.9
78
+ chat-bison (PaLM 2),3.0,2.440149003267288,381.95,60.9
79
+ chat-bison (PaLM 2),4.0,2.4795879781246186,381.95,60.9
80
+ chat-bison (PaLM 2),5.0,2.461125838756561,381.8,61.1
81
+ chat-bison (PaLM 2),6.0,2.469940322637558,381.95,60.9
82
+ chat-bison (PaLM 2),7.0,2.4428869783878326,381.95,60.9
83
+ chat-bison (PaLM 2),8.0,2.4800265431404114,381.8833333333333,60.88333333333333
84
+ chat-bison (PaLM 2),9.0,2.465018570423126,381.95,60.9
85
+ chat-bison (PaLM 2),10.0,2.4786566257476808,381.75,60.85
86
+ chat-bison (PaLM 2),11.0,2.499571430683136,381.65,60.88333333333333
87
+ chat-bison (PaLM 2),12.0,2.571754927635193,352.17,50.81
88
+ chat-bison (PaLM 2),13.0,2.522790166735649,409.325,65.3875
89
+ chat-bison (PaLM 2),14.0,2.8620632350444795,373.375,52.9875
90
+ chat-bison (PaLM 2),15.0,2.650241893529892,377.8,60.425
91
+ chat-bison (PaLM 2),16.0,3.4333535691102344,381.84166666666664,47.225
92
+ chat-bison (PaLM 2),17.0,2.5084280292193095,381.95,60.9
93
+ chat-bison (PaLM 2),18.0,2.615047258138657,381.45,60.85
94
+ chat-bison (PaLM 2),19.0,2.821215844154358,382.225,61.025
95
+ chat-bison (PaLM 2),20.0,2.591941976547241,344.725,48.275
96
+ chat-bison (PaLM 2),21.0,2.7827586233615875,383.275,47.65833333333333
97
+ chat-bison (PaLM 2),22.0,2.813016355037689,381.95,60.9
98
+ chat-bison (PaLM 2),23.0,2.463971793651581,381.85,60.875
99
+ chat-bison-32k,1.0,4.128177767992019,389.925,48.025
100
+ chat-bison-32k (PaLM 2 32K),0.0,7.170754861831665,335.75,53.85
101
+ chat-bison-32k (PaLM 2 32K),1.0,9.889513119061787,335.75,53.85
102
+ chat-bison-32k (PaLM 2 32K),2.0,4.82983283996582,335.75,53.85
103
+ chat-bison-32k (PaLM 2 32K),3.0,6.070689761638642,335.75,53.85
104
+ chat-bison-32k (PaLM 2 32K),4.0,8.697703075408935,335.75,53.85
105
+ chat-bison-32k (PaLM 2 32K),5.0,2.9196789026260377,335.75,53.85
106
+ chat-bison-32k (PaLM 2 32K),6.0,10.046520245075225,335.75,53.85
107
+ chat-bison-32k (PaLM 2 32K),7.0,8.814902746677399,335.75,53.85
108
+ chat-bison-32k (PaLM 2 32K),8.0,8.755691254138947,335.75,53.85
109
+ chat-bison-32k (PaLM 2 32K),9.0,2.943085324764252,335.75,53.85
110
+ chat-bison-32k (PaLM 2 32K),10.0,13.628323638439179,335.75,53.85
111
+ chat-bison-32k (PaLM 2 32K),11.0,7.315447652339936,335.75,53.85
112
+ chat-bison-32k (PaLM 2 32K),12.0,6.040619640350342,323.17,45.15
113
+ chat-bison-32k (PaLM 2 32K),13.0,3.8712039202451707,359.3,57.725
114
+ chat-bison-32k (PaLM 2 32K),14.0,4.875012156367302,339.6875,46.1375
115
+ chat-bison-32k (PaLM 2 32K),15.0,2.951279658079147,335.75,53.85
116
+ chat-bison-32k (PaLM 2 32K),16.0,4.577468846241633,359.4166666666667,43.775
117
+ chat-bison-32k (PaLM 2 32K),17.0,5.394908706347148,335.75,53.85
118
+ chat-bison-32k (PaLM 2 32K),18.0,7.554238790273667,335.75,53.85
119
+ chat-bison-32k (PaLM 2 32K),19.0,10.186308375000953,335.75,53.85
120
+ chat-bison-32k (PaLM 2 32K),20.0,5.36962095797062,320.025,42.975
121
+ chat-bison-32k (PaLM 2 32K),21.0,5.4035370687643685,359.4166666666667,43.775
122
+ chat-bison-32k (PaLM 2 32K),22.0,12.272967928647995,335.75,53.85
123
+ chat-bison-32k (PaLM 2 32K),23.0,10.500626176595688,335.75,53.85
124
+ gemini-pro,0.0,2.8754740890703703,364.45,57.0
125
+ gemini-pro,1.0,3.731358753455864,375.3,55.09
126
+ gemini-pro,2.0,2.664601039886475,358.825,57.425
127
+ gemini-pro,3.0,2.8943973687978892,387.0,61.725
128
+ gemini-pro,4.0,2.8736069202423096,371.375,60.025
129
+ gemini-pro,5.0,2.656540846824646,357.25,56.7
130
+ gemini-pro,6.0,2.8120841443538667,390.4,62.45
131
+ gemini-pro,7.0,2.70631699073009,378.2,60.35
132
+ gemini-pro,8.0,2.7259290743682345,377.1166666666667,60.38333333333333
133
+ gemini-pro,9.0,2.6013306021690368,396.15,63.35
134
+ gemini-pro,10.0,2.4627303073280737,381.7,59.75
135
+ gemini-pro,11.0,2.4739445872226002,360.6,57.95
136
+ gemini-pro,12.0,2.7814492097834953,348.55,49.4
137
+ gemini-pro,13.0,2.559203814856614,392.975,63.875
138
+ gemini-pro,14.0,3.1300881316787317,343.3625,47.4625
139
+ gemini-pro,15.0,2.4760417878627776,361.275,58.075
140
+ gemini-pro,16.0,3.3130789541565213,353.7,41.59166666666667
141
+ gemini-pro,17.0,2.492802628016068,388.51666666666665,61.8
142
+ gemini-pro,18.0,2.7202366315401516,362.925,57.825
143
+ gemini-pro,19.0,2.6147810145269466,392.6875,62.0125
144
+ gemini-pro,20.0,3.2052203896757843,341.85,46.6875
145
+ gemini-pro,21.0,3.6886135495227315,358.10833333333335,44.858333333333334
146
+ gemini-pro,22.0,2.6609258592128753,376.325,60.05
147
+ gemini-pro,23.0,2.590940225124359,367.15,58.6
148
+ gpt-3.5-turbo,0.0,3.5683146858215333,404.84,43.88
149
+ gpt-3.5-turbo,1.0,4.272891883608661,444.9625,48.91875
150
+ gpt-3.5-turbo,2.0,2.6514626717567444,390.22,54.64
151
+ gpt-3.5-turbo,3.0,8.802967548370361,438.15833333333336,48.75
152
+ gpt-3.5-turbo,4.0,3.9857387453317643,409.6,38.875
153
+ gpt-3.5-turbo,5.0,3.3526177048683166,391.56666666666666,45.35
154
+ gpt-3.5-turbo,6.0,3.9461031516393024,413.46666666666664,46.666666666666664
155
+ gpt-3.5-turbo,7.0,3.563987676302592,396.7,48.483333333333334
156
+ gpt-3.5-turbo,8.0,3.8539037982622784,401.06666666666666,46.88333333333333
157
+ gpt-3.5-turbo,9.0,3.774983811378479,373.15,41.81666666666667
158
+ gpt-3.5-turbo,10.0,,,
159
+ gpt-3.5-turbo,11.0,2.8019149283568066,398.40833333333336,55.5
160
+ gpt-3.5-turbo,12.0,4.098882734775543,346.4125,34.7375
161
+ gpt-3.5-turbo,13.0,3.8091073359761918,414.22857142857146,50.82142857142857
162
+ gpt-3.5-turbo,14.0,3.901234769821167,389.9,47.55833333333333
163
+ gpt-3.5-turbo,15.0,4.8184381556510925,411.03,42.87
164
+ gpt-3.5-turbo,16.0,3.899510098587383,376.54545454545456,43.67727272727273
165
+ gpt-3.5-turbo,17.0,5.015711693763733,425.6,42.83
166
+ gpt-3.5-turbo,18.0,3.721581067641576,378.26666666666665,44.46666666666667
167
+ gpt-3.5-turbo,19.0,3.851715175310771,399.625,46.0
168
+ gpt-3.5-turbo,20.0,3.153710008992089,380.1611111111111,47.05555555555556
169
+ gpt-3.5-turbo,21.0,4.117136875174681,407.26153846153846,40.63076923076923
170
+ gpt-3.5-turbo,22.0,3.208261313041051,396.3,46.266666666666666
171
+ gpt-3.5-turbo,23.0,8.566175188620885,441.65833333333336,49.28333333333333
172
+ gpt-4,0.0,12.091028991371694,316.73,37.44
173
+ gpt-4,1.0,12.780311059551078,338.25416666666666,40.09166666666667
174
+ gpt-4,2.0,11.616398258209228,341.39,48.28
175
+ gpt-4,3.0,12.220598830779393,324.725,40.541666666666664
176
+ gpt-4,4.0,13.938926541805268,303.1625,31.9875
177
+ gpt-4,5.0,12.497149809201558,319.71666666666664,40.63333333333333
178
+ gpt-4,6.0,13.388921443621317,330.0833333333333,41.46666666666667
179
+ gpt-4,7.0,14.678142400582631,323.53333333333336,40.733333333333334
180
+ gpt-4,8.0,14.978816239039103,317.0,39.43333333333333
181
+ gpt-4,9.0,15.373240264256795,324.98333333333335,40.5
182
+ gpt-4,10.0,,,
183
+ gpt-4,11.0,11.441057385516768,344.78333333333336,50.025
184
+ gpt-4,12.0,17.375231413543226,295.78125,31.23125
185
+ gpt-4,13.0,15.355684958185469,337.90714285714284,44.85
186
+ gpt-4,14.0,14.926335791746775,325.48333333333335,41.733333333333334
187
+ gpt-4,15.0,17.480767397880555,301.15,34.69
188
+ gpt-4,16.0,17.60613609231226,325.15,39.6
189
+ gpt-4,17.0,14.354735706791732,299.63,35.66
190
+ gpt-4,18.0,13.452181231975555,317.68333333333334,39.675
191
+ gpt-4,19.0,14.330684673786163,317.45,39.791666666666664
192
+ gpt-4,20.0,13.774037790298461,318.76666666666665,40.80555555555556
193
+ gpt-4,21.0,15.565142148249858,308.5769230769231,33.707692307692305
194
+ gpt-4,22.0,15.137496527036031,323.8666666666667,41.00833333333333
195
+ gpt-4,23.0,10.696240643493267,317.28333333333336,40.175
196
+ gpt-4-turbo,0.0,11.938190605640411,384.78,44.55
197
+ gpt-4-turbo,1.0,14.554479810595513,382.94166666666666,48.0625
198
+ gpt-4-turbo,2.0,13.72197850227356,380.31,49.62
199
+ gpt-4-turbo,3.0,11.976015224059422,370.85833333333335,49.108333333333334
200
+ gpt-4-turbo,4.0,17.072669982910156,366.9875,44.7875
201
+ gpt-4-turbo,5.0,15.055192097028096,296.6666666666667,43.03333333333333
202
+ gpt-4-turbo,6.0,15.722527865568797,378.6166666666667,51.416666666666664
203
+ gpt-4-turbo,7.0,7.6716701745986935,302.23333333333335,40.96666666666667
204
+ gpt-4-turbo,8.0,11.272664443651836,392.1166666666667,49.266666666666666
205
+ gpt-4-turbo,9.0,20.45977386633555,332.1166666666667,43.5
206
+ gpt-4-turbo,10.0,,,
207
+ gpt-4-turbo,11.0,10.300394964218139,406.775,60.791666666666664
208
+ gpt-4-turbo,12.0,16.01451396048069,374.3375,45.11875
209
+ gpt-4-turbo,13.0,13.703989851474763,327.0571428571429,46.714285714285715
210
+ gpt-4-turbo,14.0,11.651468181610108,347.85833333333335,46.458333333333336
211
+ gpt-4-turbo,15.0,37.896924748420716,367.4,49.16
212
+ gpt-4-turbo,16.0,18.2455517671325,395.83181818181816,48.56818181818182
213
+ gpt-4-turbo,17.0,15.710689465999604,364.73,42.88
214
+ gpt-4-turbo,18.0,16.597523101170857,379.60833333333335,47.983333333333334
215
+ gpt-4-turbo,19.0,19.196569097042083,355.68333333333334,46.958333333333336
216
+ gpt-4-turbo,20.0,14.754687264230515,401.8777777777778,49.75555555555555
217
+ gpt-4-turbo,21.0,14.39423566047962,439.87692307692305,42.72692307692308
218
+ gpt-4-turbo,22.0,17.963759408394495,437.6,50.358333333333334
219
+ gpt-4-turbo,23.0,11.649714199701945,332.7083333333333,43.733333333333334
220
+ llama-2-70b-chat,0.0,2.7049551407496133,312.85,48.55
221
+ llama-2-70b-chat,1.0,3.5678966999053956,355.78,52.5
222
+ llama-2-70b-chat,2.0,2.7264933708386545,341.675,52.75
223
+ llama-2-70b-chat,3.0,3.13531751036644,355.5,54.75
224
+ llama-2-70b-chat,4.0,2.6207807064056396,262.85,40.7
225
+ llama-2-70b-chat,5.0,2.4901255933861983,331.85,51.2
226
+ llama-2-70b-chat,6.0,3.237797245834813,298.0,46.025
227
+ llama-2-70b-chat,7.0,2.8074560369764057,309.8,47.225
228
+ llama-2-70b-chat,8.0,2.643855281498121,270.68333333333334,41.93333333333333
229
+ llama-2-70b-chat,9.0,2.270249330997467,355.5,54.75
230
+ llama-2-70b-chat,10.0,2.6760833263397217,165.55,25.2
231
+ llama-2-70b-chat,11.0,3.1485369634628295,298.56666666666666,45.766666666666666
232
+ llama-2-70b-chat,12.0,4.026921252409617,294.06,42.54
233
+ llama-2-70b-chat,13.0,4.110724348770945,428.7375,65.5375
234
+ llama-2-70b-chat,14.0,4.592028452555339,423.8875,60.8125
235
+ llama-2-70b-chat,15.0,2.76978215304288,285.925,44.15
236
+ llama-2-70b-chat,16.0,4.2957686424255375,572.3083333333333,74.625
237
+ llama-2-70b-chat,17.0,2.720098500781589,254.86666666666667,39.28333333333333
238
+ llama-2-70b-chat,18.0,2.9921934604644775,326.375,50.025
239
+ llama-2-70b-chat,19.0,2.7523183100151294,283.95,43.8375
240
+ llama-2-70b-chat,20.0,3.1451149598146095,345.975,49.65
241
+ llama-2-70b-chat,21.0,4.558388976727501,556.1583333333333,71.875
242
+ llama-2-70b-chat,22.0,3.0530899854806752,348.0,53.65
243
+ llama-2-70b-chat,23.0,2.941225928068161,355.5,54.75
244
+ zephyr-7b-beta,0.0,,,
245
+ zephyr-7b-beta,1.0,1.9264068841934203,29.75,3.3
246
+ zephyr-7b-beta,2.0,,,
247
+ zephyr-7b-beta,3.0,,,
248
+ zephyr-7b-beta,4.0,,,
249
+ zephyr-7b-beta,5.0,,,
250
+ zephyr-7b-beta,6.0,,,
251
+ zephyr-7b-beta,7.0,,,
252
+ zephyr-7b-beta,8.0,,,
253
+ zephyr-7b-beta,9.0,,,
254
+ zephyr-7b-beta,10.0,,,
255
+ zephyr-7b-beta,11.0,4.056525647640228,386.3,63.35
256
+ zephyr-7b-beta,12.0,3.3402509868144987,216.9,33.575
257
+ zephyr-7b-beta,13.0,,,
258
+ zephyr-7b-beta,14.0,4.056431210041046,399.0,64.9
259
+ zephyr-7b-beta,15.0,4.06974081993103,386.3,63.35
260
+ zephyr-7b-beta,16.0,3.304698485362379,214.1625,32.7875
261
+ zephyr-7b-beta,17.0,,,
262
+ zephyr-7b-beta,18.0,4.079625189304352,386.3,63.35
263
+ zephyr-7b-beta,19.0,,,
264
+ zephyr-7b-beta,20.0,3.3111458659172057,216.9,33.575
265
+ zephyr-7b-beta,21.0,3.339973047375679,219.1875,33.6875
266
+ zephyr-7b-beta,22.0,,,
267
+ zephyr-7b-beta,23.0,,,
data/2024-02-03 22:30:15.856748_time_of_day_comparison.csv ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,time,execution_time,characters_count,words_count
2
+ Mistral-7B-Instruct-v0.2,afternoon 12-14,3.228973722457886,222.0625,32.25
3
+ Mistral-7B-Instruct-v0.2,early morning 6-8,,,
4
+ Mistral-7B-Instruct-v0.2,evening 18-20,3.397640073299408,261.18333333333334,40.1
5
+ Mistral-7B-Instruct-v0.2,late afternoon 15-17,3.2048643112182615,219.8625,31.8
6
+ Mistral-7B-Instruct-v0.2,morning 9-11,3.734026002883911,362.9,58.35
7
+ Mistral-7B-Instruct-v0.2,night 0-2,1.9149879813194275,37.8,2.95
8
+ Mistral-7B-Instruct-v0.2,night 21-23,3.389284573495388,175.79375,25.68125
9
+ Mistral-7B-Instruct-v0.2,night 3-5,,,
10
+ Mixtral-8x7B-Instruct-v0.1,afternoon 12-14,5.362903979589355,369.3192307692308,54.353846153846156
11
+ Mixtral-8x7B-Instruct-v0.1,early morning 6-8,3.2748278152374994,243.2642857142857,37.57857142857143
12
+ Mixtral-8x7B-Instruct-v0.1,evening 18-20,3.6435119574237023,326.69,48.545
13
+ Mixtral-8x7B-Instruct-v0.1,late afternoon 15-17,5.80184749175942,347.9681818181818,47.27272727272727
14
+ Mixtral-8x7B-Instruct-v0.1,morning 9-11,3.9661054956285575,304.82,47.28
15
+ Mixtral-8x7B-Instruct-v0.1,night 0-2,3.8265925436529495,362.25625,52.85625
16
+ Mixtral-8x7B-Instruct-v0.1,night 21-23,5.62397656769588,395.15714285714284,49.02857142857143
17
+ Mixtral-8x7B-Instruct-v0.1,night 3-5,3.010503646099206,262.8,40.56
18
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,afternoon 12-14,1.8381905496120452,308.795,51.08
19
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,early morning 6-8,2.0273348593711855,372.13,62.53
20
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,evening 18-20,1.7984187936782836,313.99,51.96
21
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,late afternoon 15-17,1.7547113946505954,285.17857142857144,46.9
22
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,morning 9-11,1.9041210174560548,372.05,62.6
23
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,night 0-2,1.6341248273849487,210.2,34.2
24
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,night 21-23,1.5875422928068372,192.78333333333333,31.261111111111113
25
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,night 3-5,2.0128010153770446,372.05,62.6
26
+ chat-bison,night 0-2,3.890243631601334,398.075,49.0
27
+ chat-bison (PaLM 2),afternoon 12-14,2.6460144804074215,376.28076923076924,55.965384615384615
28
+ chat-bison (PaLM 2),early morning 6-8,2.4665334616388592,381.9214285714286,60.892857142857146
29
+ chat-bison (PaLM 2),evening 18-20,2.688272579908371,367.07,55.89
30
+ chat-bison (PaLM 2),late afternoon 15-17,3.0387172081253744,381.1363636363636,53.35454545454545
31
+ chat-bison (PaLM 2),morning 9-11,2.488477897644043,381.73,60.88
32
+ chat-bison (PaLM 2),night 0-2,2.468383938074112,381.95,60.9
33
+ chat-bison (PaLM 2),night 21-23,2.7250528037548065,382.725,52.95
34
+ chat-bison (PaLM 2),night 3-5,2.460119960308075,381.92,60.94
35
+ chat-bison-32k,night 0-2,4.128177767992019,389.925,48.025
36
+ chat-bison-32k (PaLM 2 32K),afternoon 12-14,5.014458654477046,339.3692307692308,49.323076923076925
37
+ chat-bison-32k (PaLM 2 32K),early morning 6-8,9.141417106560299,335.75,53.85
38
+ chat-bison-32k (PaLM 2 32K),evening 18-20,7.7332194912433625,329.46,49.5
39
+ chat-bison-32k (PaLM 2 32K),late afternoon 15-17,4.5047362284226855,348.65909090909093,48.35454545454545
40
+ chat-bison-32k (PaLM 2 32K),morning 9-11,7.7035503840446475,335.75,53.85
41
+ chat-bison-32k (PaLM 2 32K),night 0-2,7.7498266498247785,335.75,53.85
42
+ chat-bison-32k (PaLM 2 32K),night 21-23,7.796841062307358,349.95,47.805
43
+ chat-bison-32k (PaLM 2 32K),night 3-5,6.491292915344238,335.75,53.85
44
+ gemini-pro,afternoon 12-14,2.816922114008949,360.62307692307695,53.25769230769231
45
+ gemini-pro,early morning 6-8,2.7453590130460435,381.2214285714286,60.964285714285715
46
+ gemini-pro,evening 18-20,2.86901999375759,366.4,55.045
47
+ gemini-pro,late afternoon 15-17,2.9268629640903114,364.57272727272726,50.1
48
+ gemini-pro,morning 9-11,2.497767536007628,371.93,59.39
49
+ gemini-pro,night 0-2,3.338477972348531,369.825,55.9125
50
+ gemini-pro,night 21-23,3.7189874940246117,390.9142857142857,51.35
51
+ gemini-pro,night 3-5,2.8375814715210272,374.8,60.04
52
+ gpt-3.5-turbo,afternoon 12-14,3.9458200880459375,381.4428571428571,43.76190476190476
53
+ gpt-3.5-turbo,early morning 6-8,3.787998208734724,403.74444444444447,47.34444444444444
54
+ gpt-3.5-turbo,evening 18-20,3.5153889304115657,385.18095238095236,46.01428571428571
55
+ gpt-3.5-turbo,late afternoon 15-17,4.384064777692159,396.4357142857143,43.28333333333333
56
+ gpt-3.5-turbo,morning 9-11,3.126271222697364,389.9888888888889,50.93888888888889
57
+ gpt-3.5-turbo,night 0-2,3.822115447632102,426.71923076923076,49.05
58
+ gpt-3.5-turbo,night 21-23,5.110168156187617,422.73510971786834,45.358934169278996
59
+ gpt-3.5-turbo,night 3-5,6.062970260473398,418.6192307692308,44.926923076923075
60
+ gpt-4,afternoon 12-14,16.002364798386893,318.3095238095238,38.77142857142857
61
+ gpt-4,early morning 6-8,14.348626694414351,323.5388888888889,40.544444444444444
62
+ gpt-4,evening 18-20,13.841120740345547,318.0809523809524,40.19285714285714
63
+ gpt-4,late afternoon 15-17,16.80607506932254,313.3595238095238,37.49285714285714
64
+ gpt-4,morning 9-11,12.759107512468733,338.18333333333334,46.85
65
+ gpt-4,night 0-2,12.3578163115329,334.075,41.35
66
+ gpt-4,night 21-23,14.298642643005493,314.336,37.012
67
+ gpt-4,night 3-5,12.813134506115546,316.93461538461537,37.93076923076923
68
+ gpt-4-turbo,afternoon 12-14,13.997754749229976,351.01190476190476,46.03333333333333
69
+ gpt-4-turbo,early morning 6-8,11.555620827939775,357.65555555555557,47.21666666666667
70
+ gpt-4-turbo,evening 18-20,16.550320884159632,382.31666666666666,48.45
71
+ gpt-4-turbo,late afternoon 15-17,22.320911452883767,381.65714285714284,47.35476190476191
72
+ gpt-4-turbo,morning 9-11,13.686854598257277,381.8888888888889,55.02777777777778
73
+ gpt-4-turbo,night 0-2,13.770663784850727,382.7613636363636,47.61818181818182
74
+ gpt-4-turbo,night 21-23,14.592236209392548,413.61,44.8
75
+ gpt-4-turbo,night 3-5,14.254795966698573,352.54615384615386,46.37692307692308
76
+ llama-2-70b-chat,afternoon 12-14,4.234376892130426,375.44615384615383,55.238461538461536
77
+ llama-2-70b-chat,early morning 6-8,2.8660141522424265,289.6642857142857,44.614285714285714
78
+ llama-2-70b-chat,evening 18-20,2.9706250462084185,317.245,47.4
79
+ llama-2-70b-chat,late afternoon 15-17,3.6833307104881365,433.6636363636364,59.445454545454545
80
+ llama-2-70b-chat,morning 9-11,2.872361832027194,283.35,43.45
81
+ llama-2-70b-chat,night 0-2,3.249819871626402,346.8875,52.06875
82
+ llama-2-70b-chat,night 21-23,4.719581684340602,572.1689655172414,79.83103448275862
83
+ llama-2-70b-chat,night 3-5,2.8264514451677147,313.71,48.42
84
+ zephyr-7b-beta,afternoon 12-14,3.5789777278900146,277.6,44.016666666666666
85
+ zephyr-7b-beta,early morning 6-8,,,
86
+ zephyr-7b-beta,evening 18-20,3.5673056403795878,273.3666666666667,43.5
87
+ zephyr-7b-beta,late afternoon 15-17,3.4592524923459447,248.59,38.9
88
+ zephyr-7b-beta,morning 9-11,4.056525647640228,386.3,63.35
89
+ zephyr-7b-beta,night 0-2,1.9264068841934203,29.75,3.3
90
+ zephyr-7b-beta,night 21-23,3.45343524068594,176.23125,27.21875
91
+ zephyr-7b-beta,night 3-5,,,
data/2024-02-03 22:31:14.132394_time_of_day_comparison.csv ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,time_of_day,execution_time,characters_count,words_count
2
+ Mistral-7B-Instruct-v0.2,afternoon 12-14,3.228973722457886,222.0625,32.25
3
+ Mistral-7B-Instruct-v0.2,early morning 6-8,,,
4
+ Mistral-7B-Instruct-v0.2,evening 18-20,3.397640073299408,261.18333333333334,40.1
5
+ Mistral-7B-Instruct-v0.2,late afternoon 15-17,3.2048643112182615,219.8625,31.8
6
+ Mistral-7B-Instruct-v0.2,morning 9-11,3.734026002883911,362.9,58.35
7
+ Mistral-7B-Instruct-v0.2,night 0-2,1.9149879813194275,37.8,2.95
8
+ Mistral-7B-Instruct-v0.2,night 21-23,3.389284573495388,175.79375,25.68125
9
+ Mistral-7B-Instruct-v0.2,night 3-5,,,
10
+ Mixtral-8x7B-Instruct-v0.1,afternoon 12-14,5.362903979589355,369.3192307692308,54.353846153846156
11
+ Mixtral-8x7B-Instruct-v0.1,early morning 6-8,3.2748278152374994,243.2642857142857,37.57857142857143
12
+ Mixtral-8x7B-Instruct-v0.1,evening 18-20,3.6435119574237023,326.69,48.545
13
+ Mixtral-8x7B-Instruct-v0.1,late afternoon 15-17,5.80184749175942,347.9681818181818,47.27272727272727
14
+ Mixtral-8x7B-Instruct-v0.1,morning 9-11,3.9661054956285575,304.82,47.28
15
+ Mixtral-8x7B-Instruct-v0.1,night 0-2,3.8265925436529495,362.25625,52.85625
16
+ Mixtral-8x7B-Instruct-v0.1,night 21-23,5.62397656769588,395.15714285714284,49.02857142857143
17
+ Mixtral-8x7B-Instruct-v0.1,night 3-5,3.010503646099206,262.8,40.56
18
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,afternoon 12-14,1.8381905496120452,308.795,51.08
19
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,early morning 6-8,2.0273348593711855,372.13,62.53
20
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,evening 18-20,1.7984187936782836,313.99,51.96
21
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,late afternoon 15-17,1.7547113946505954,285.17857142857144,46.9
22
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,morning 9-11,1.9041210174560548,372.05,62.6
23
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,night 0-2,1.6341248273849487,210.2,34.2
24
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,night 21-23,1.5875422928068372,192.78333333333333,31.261111111111113
25
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,night 3-5,2.0128010153770446,372.05,62.6
26
+ chat-bison,night 0-2,3.890243631601334,398.075,49.0
27
+ chat-bison (PaLM 2),afternoon 12-14,2.6460144804074215,376.28076923076924,55.965384615384615
28
+ chat-bison (PaLM 2),early morning 6-8,2.4665334616388592,381.9214285714286,60.892857142857146
29
+ chat-bison (PaLM 2),evening 18-20,2.688272579908371,367.07,55.89
30
+ chat-bison (PaLM 2),late afternoon 15-17,3.0387172081253744,381.1363636363636,53.35454545454545
31
+ chat-bison (PaLM 2),morning 9-11,2.488477897644043,381.73,60.88
32
+ chat-bison (PaLM 2),night 0-2,2.468383938074112,381.95,60.9
33
+ chat-bison (PaLM 2),night 21-23,2.7250528037548065,382.725,52.95
34
+ chat-bison (PaLM 2),night 3-5,2.460119960308075,381.92,60.94
35
+ chat-bison-32k,night 0-2,4.128177767992019,389.925,48.025
36
+ chat-bison-32k (PaLM 2 32K),afternoon 12-14,5.014458654477046,339.3692307692308,49.323076923076925
37
+ chat-bison-32k (PaLM 2 32K),early morning 6-8,9.141417106560299,335.75,53.85
38
+ chat-bison-32k (PaLM 2 32K),evening 18-20,7.7332194912433625,329.46,49.5
39
+ chat-bison-32k (PaLM 2 32K),late afternoon 15-17,4.5047362284226855,348.65909090909093,48.35454545454545
40
+ chat-bison-32k (PaLM 2 32K),morning 9-11,7.7035503840446475,335.75,53.85
41
+ chat-bison-32k (PaLM 2 32K),night 0-2,7.7498266498247785,335.75,53.85
42
+ chat-bison-32k (PaLM 2 32K),night 21-23,7.796841062307358,349.95,47.805
43
+ chat-bison-32k (PaLM 2 32K),night 3-5,6.491292915344238,335.75,53.85
44
+ gemini-pro,afternoon 12-14,2.816922114008949,360.62307692307695,53.25769230769231
45
+ gemini-pro,early morning 6-8,2.7453590130460435,381.2214285714286,60.964285714285715
46
+ gemini-pro,evening 18-20,2.86901999375759,366.4,55.045
47
+ gemini-pro,late afternoon 15-17,2.9268629640903114,364.57272727272726,50.1
48
+ gemini-pro,morning 9-11,2.497767536007628,371.93,59.39
49
+ gemini-pro,night 0-2,3.338477972348531,369.825,55.9125
50
+ gemini-pro,night 21-23,3.7189874940246117,390.9142857142857,51.35
51
+ gemini-pro,night 3-5,2.8375814715210272,374.8,60.04
52
+ gpt-3.5-turbo,afternoon 12-14,3.9458200880459375,381.4428571428571,43.76190476190476
53
+ gpt-3.5-turbo,early morning 6-8,3.787998208734724,403.74444444444447,47.34444444444444
54
+ gpt-3.5-turbo,evening 18-20,3.5153889304115657,385.18095238095236,46.01428571428571
55
+ gpt-3.5-turbo,late afternoon 15-17,4.384064777692159,396.4357142857143,43.28333333333333
56
+ gpt-3.5-turbo,morning 9-11,3.126271222697364,389.9888888888889,50.93888888888889
57
+ gpt-3.5-turbo,night 0-2,3.822115447632102,426.71923076923076,49.05
58
+ gpt-3.5-turbo,night 21-23,5.110168156187617,422.73510971786834,45.358934169278996
59
+ gpt-3.5-turbo,night 3-5,6.062970260473398,418.6192307692308,44.926923076923075
60
+ gpt-4,afternoon 12-14,16.002364798386893,318.3095238095238,38.77142857142857
61
+ gpt-4,early morning 6-8,14.348626694414351,323.5388888888889,40.544444444444444
62
+ gpt-4,evening 18-20,13.841120740345547,318.0809523809524,40.19285714285714
63
+ gpt-4,late afternoon 15-17,16.80607506932254,313.3595238095238,37.49285714285714
64
+ gpt-4,morning 9-11,12.759107512468733,338.18333333333334,46.85
65
+ gpt-4,night 0-2,12.3578163115329,334.075,41.35
66
+ gpt-4,night 21-23,14.298642643005493,314.336,37.012
67
+ gpt-4,night 3-5,12.813134506115546,316.93461538461537,37.93076923076923
68
+ gpt-4-turbo,afternoon 12-14,13.997754749229976,351.01190476190476,46.03333333333333
69
+ gpt-4-turbo,early morning 6-8,11.555620827939775,357.65555555555557,47.21666666666667
70
+ gpt-4-turbo,evening 18-20,16.550320884159632,382.31666666666666,48.45
71
+ gpt-4-turbo,late afternoon 15-17,22.320911452883767,381.65714285714284,47.35476190476191
72
+ gpt-4-turbo,morning 9-11,13.686854598257277,381.8888888888889,55.02777777777778
73
+ gpt-4-turbo,night 0-2,13.770663784850727,382.7613636363636,47.61818181818182
74
+ gpt-4-turbo,night 21-23,14.592236209392548,413.61,44.8
75
+ gpt-4-turbo,night 3-5,14.254795966698573,352.54615384615386,46.37692307692308
76
+ llama-2-70b-chat,afternoon 12-14,4.234376892130426,375.44615384615383,55.238461538461536
77
+ llama-2-70b-chat,early morning 6-8,2.8660141522424265,289.6642857142857,44.614285714285714
78
+ llama-2-70b-chat,evening 18-20,2.9706250462084185,317.245,47.4
79
+ llama-2-70b-chat,late afternoon 15-17,3.6833307104881365,433.6636363636364,59.445454545454545
80
+ llama-2-70b-chat,morning 9-11,2.872361832027194,283.35,43.45
81
+ llama-2-70b-chat,night 0-2,3.249819871626402,346.8875,52.06875
82
+ llama-2-70b-chat,night 21-23,4.719581684340602,572.1689655172414,79.83103448275862
83
+ llama-2-70b-chat,night 3-5,2.8264514451677147,313.71,48.42
84
+ zephyr-7b-beta,afternoon 12-14,3.5789777278900146,277.6,44.016666666666666
85
+ zephyr-7b-beta,early morning 6-8,,,
86
+ zephyr-7b-beta,evening 18-20,3.5673056403795878,273.3666666666667,43.5
87
+ zephyr-7b-beta,late afternoon 15-17,3.4592524923459447,248.59,38.9
88
+ zephyr-7b-beta,morning 9-11,4.056525647640228,386.3,63.35
89
+ zephyr-7b-beta,night 0-2,1.9264068841934203,29.75,3.3
90
+ zephyr-7b-beta,night 21-23,3.45343524068594,176.23125,27.21875
91
+ zephyr-7b-beta,night 3-5,,,
data/2024-02-03 22:33:36.957992_time_of_day_comparison.csv ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,time_of_day,execution_time,characters_count,words_count
2
+ Mistral-7B-Instruct-v0.2,0-2 midnight,1.9149879813194275,37.8,2.95
3
+ Mistral-7B-Instruct-v0.2,12-14 afternoon,3.228973722457886,222.0625,32.25
4
+ Mistral-7B-Instruct-v0.2,15-17 late afternoon,3.2048643112182615,219.8625,31.8
5
+ Mistral-7B-Instruct-v0.2,18-20 evening,3.397640073299408,261.18333333333334,40.1
6
+ Mistral-7B-Instruct-v0.2,21-23 late evening,3.389284573495388,175.79375,25.68125
7
+ Mistral-7B-Instruct-v0.2,3-5 night,,,
8
+ Mistral-7B-Instruct-v0.2,6-8 early morning,,,
9
+ Mistral-7B-Instruct-v0.2,9-11 morning,3.734026002883911,362.9,58.35
10
+ Mixtral-8x7B-Instruct-v0.1,0-2 midnight,3.8265925436529495,362.25625,52.85625
11
+ Mixtral-8x7B-Instruct-v0.1,12-14 afternoon,5.362903979589355,369.3192307692308,54.353846153846156
12
+ Mixtral-8x7B-Instruct-v0.1,15-17 late afternoon,5.80184749175942,347.9681818181818,47.27272727272727
13
+ Mixtral-8x7B-Instruct-v0.1,18-20 evening,3.6435119574237023,326.69,48.545
14
+ Mixtral-8x7B-Instruct-v0.1,21-23 late evening,5.62397656769588,395.15714285714284,49.02857142857143
15
+ Mixtral-8x7B-Instruct-v0.1,3-5 night,3.010503646099206,262.8,40.56
16
+ Mixtral-8x7B-Instruct-v0.1,6-8 early morning,3.2748278152374994,243.2642857142857,37.57857142857143
17
+ Mixtral-8x7B-Instruct-v0.1,9-11 morning,3.9661054956285575,304.82,47.28
18
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,0-2 midnight,1.6341248273849487,210.2,34.2
19
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,12-14 afternoon,1.8381905496120452,308.795,51.08
20
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,15-17 late afternoon,1.7547113946505954,285.17857142857144,46.9
21
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,18-20 evening,1.7984187936782836,313.99,51.96
22
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,21-23 late evening,1.5875422928068372,192.78333333333333,31.261111111111113
23
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,3-5 night,2.0128010153770446,372.05,62.6
24
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,6-8 early morning,2.0273348593711855,372.13,62.53
25
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,9-11 morning,1.9041210174560548,372.05,62.6
26
+ chat-bison,0-2 midnight,3.890243631601334,398.075,49.0
27
+ chat-bison (PaLM 2),0-2 midnight,2.468383938074112,381.95,60.9
28
+ chat-bison (PaLM 2),12-14 afternoon,2.6460144804074215,376.28076923076924,55.965384615384615
29
+ chat-bison (PaLM 2),15-17 late afternoon,3.0387172081253744,381.1363636363636,53.35454545454545
30
+ chat-bison (PaLM 2),18-20 evening,2.688272579908371,367.07,55.89
31
+ chat-bison (PaLM 2),21-23 late evening,2.7250528037548065,382.725,52.95
32
+ chat-bison (PaLM 2),3-5 night,2.460119960308075,381.92,60.94
33
+ chat-bison (PaLM 2),6-8 early morning,2.4665334616388592,381.9214285714286,60.892857142857146
34
+ chat-bison (PaLM 2),9-11 morning,2.488477897644043,381.73,60.88
35
+ chat-bison-32k,0-2 midnight,4.128177767992019,389.925,48.025
36
+ chat-bison-32k (PaLM 2 32K),0-2 midnight,7.7498266498247785,335.75,53.85
37
+ chat-bison-32k (PaLM 2 32K),12-14 afternoon,5.014458654477046,339.3692307692308,49.323076923076925
38
+ chat-bison-32k (PaLM 2 32K),15-17 late afternoon,4.5047362284226855,348.65909090909093,48.35454545454545
39
+ chat-bison-32k (PaLM 2 32K),18-20 evening,7.7332194912433625,329.46,49.5
40
+ chat-bison-32k (PaLM 2 32K),21-23 late evening,7.796841062307358,349.95,47.805
41
+ chat-bison-32k (PaLM 2 32K),3-5 night,6.491292915344238,335.75,53.85
42
+ chat-bison-32k (PaLM 2 32K),6-8 early morning,9.141417106560299,335.75,53.85
43
+ chat-bison-32k (PaLM 2 32K),9-11 morning,7.7035503840446475,335.75,53.85
44
+ gemini-pro,0-2 midnight,3.338477972348531,369.825,55.9125
45
+ gemini-pro,12-14 afternoon,2.816922114008949,360.62307692307695,53.25769230769231
46
+ gemini-pro,15-17 late afternoon,2.9268629640903114,364.57272727272726,50.1
47
+ gemini-pro,18-20 evening,2.86901999375759,366.4,55.045
48
+ gemini-pro,21-23 late evening,3.7189874940246117,390.9142857142857,51.35
49
+ gemini-pro,3-5 night,2.8375814715210272,374.8,60.04
50
+ gemini-pro,6-8 early morning,2.7453590130460435,381.2214285714286,60.964285714285715
51
+ gemini-pro,9-11 morning,2.497767536007628,371.93,59.39
52
+ gpt-3.5-turbo,0-2 midnight,3.822115447632102,426.71923076923076,49.05
53
+ gpt-3.5-turbo,12-14 afternoon,3.9458200880459375,381.4428571428571,43.76190476190476
54
+ gpt-3.5-turbo,15-17 late afternoon,4.384064777692159,396.4357142857143,43.28333333333333
55
+ gpt-3.5-turbo,18-20 evening,3.5153889304115657,385.18095238095236,46.01428571428571
56
+ gpt-3.5-turbo,21-23 late evening,5.110168156187617,422.73510971786834,45.358934169278996
57
+ gpt-3.5-turbo,3-5 night,6.062970260473398,418.6192307692308,44.926923076923075
58
+ gpt-3.5-turbo,6-8 early morning,3.787998208734724,403.74444444444447,47.34444444444444
59
+ gpt-3.5-turbo,9-11 morning,3.126271222697364,389.9888888888889,50.93888888888889
60
+ gpt-4,0-2 midnight,12.3578163115329,334.075,41.35
61
+ gpt-4,12-14 afternoon,16.002364798386893,318.3095238095238,38.77142857142857
62
+ gpt-4,15-17 late afternoon,16.80607506932254,313.3595238095238,37.49285714285714
63
+ gpt-4,18-20 evening,13.841120740345547,318.0809523809524,40.19285714285714
64
+ gpt-4,21-23 late evening,14.298642643005493,314.336,37.012
65
+ gpt-4,3-5 night,12.813134506115546,316.93461538461537,37.93076923076923
66
+ gpt-4,6-8 early morning,14.348626694414351,323.5388888888889,40.544444444444444
67
+ gpt-4,9-11 morning,12.759107512468733,338.18333333333334,46.85
68
+ gpt-4-turbo,0-2 midnight,13.770663784850727,382.7613636363636,47.61818181818182
69
+ gpt-4-turbo,12-14 afternoon,13.997754749229976,351.01190476190476,46.03333333333333
70
+ gpt-4-turbo,15-17 late afternoon,22.320911452883767,381.65714285714284,47.35476190476191
71
+ gpt-4-turbo,18-20 evening,16.550320884159632,382.31666666666666,48.45
72
+ gpt-4-turbo,21-23 late evening,14.592236209392548,413.61,44.8
73
+ gpt-4-turbo,3-5 night,14.254795966698573,352.54615384615386,46.37692307692308
74
+ gpt-4-turbo,6-8 early morning,11.555620827939775,357.65555555555557,47.21666666666667
75
+ gpt-4-turbo,9-11 morning,13.686854598257277,381.8888888888889,55.02777777777778
76
+ llama-2-70b-chat,0-2 midnight,3.249819871626402,346.8875,52.06875
77
+ llama-2-70b-chat,12-14 afternoon,4.234376892130426,375.44615384615383,55.238461538461536
78
+ llama-2-70b-chat,15-17 late afternoon,3.6833307104881365,433.6636363636364,59.445454545454545
79
+ llama-2-70b-chat,18-20 evening,2.9706250462084185,317.245,47.4
80
+ llama-2-70b-chat,21-23 late evening,4.719581684340602,572.1689655172414,79.83103448275862
81
+ llama-2-70b-chat,3-5 night,2.8264514451677147,313.71,48.42
82
+ llama-2-70b-chat,6-8 early morning,2.8660141522424265,289.6642857142857,44.614285714285714
83
+ llama-2-70b-chat,9-11 morning,2.872361832027194,283.35,43.45
84
+ zephyr-7b-beta,0-2 midnight,1.9264068841934203,29.75,3.3
85
+ zephyr-7b-beta,12-14 afternoon,3.5789777278900146,277.6,44.016666666666666
86
+ zephyr-7b-beta,15-17 late afternoon,3.4592524923459447,248.59,38.9
87
+ zephyr-7b-beta,18-20 evening,3.5673056403795878,273.3666666666667,43.5
88
+ zephyr-7b-beta,21-23 late evening,3.45343524068594,176.23125,27.21875
89
+ zephyr-7b-beta,3-5 night,,,
90
+ zephyr-7b-beta,6-8 early morning,,,
91
+ zephyr-7b-beta,9-11 morning,4.056525647640228,386.3,63.35
data/2024-02-03 22:42:23.322179_summary.csv ADDED
@@ -0,0 +1,75 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,language,template_name,execution_time,characters_count,words_count,chunk_sizes_mean,chunk_sizes_min,chunk_sizes_max,chunk_generation_times_mean,chunk_generation_times_min,chunk_generation_times_max
2
+ Mistral-7B-Instruct-v0.2,english,call,,,,,,,,,
3
+ Mistral-7B-Instruct-v0.2,english,json,4.278648148264204,342.8,55.15,4.1311870534561415,1.0,15.0,0.040544769239987996,0.00024437904357910156,60.7178213596344
4
+ Mistral-7B-Instruct-v0.2,english,markdown,3.7188014924526214,366.85,57.1375,4.239202657807309,1.0,16.0,0.03371991898375372,0.020945072174072266,0.25538039207458496
5
+ Mistral-7B-Instruct-v0.2,japanese,call,,,,,,,,,
6
+ Mistral-7B-Instruct-v0.2,japanese,json,2.413569121701377,52.07857142857143,3.414285714285714,1.2991803278688525,1.0,11.0,0.039267738759305254,0.00047779083251953125,3.370748996734619
7
+ Mistral-7B-Instruct-v0.2,japanese,markdown,2.323612022399902,42.25,1.5833333333333333,1.1069868995633187,1.0,6.0,0.03958142719935121,0.0004932880401611328,0.2205650806427002
8
+ Mixtral-8x7B-Instruct-v0.1,english,call,,,,,,,,,
9
+ Mixtral-8x7B-Instruct-v0.1,english,json,3.643989532061343,295.4172413793103,45.744827586206895,4.137546333747872,1.0,15.0,0.014243678199270911,0.00020456314086914062,3.4127349853515625
10
+ Mixtral-8x7B-Instruct-v0.1,english,markdown,5.995457515120506,512.57,81.75,4.360071452875127,1.0,15.0,0.016480832612607788,0.00021076202392578125,1.7103569507598877
11
+ Mixtral-8x7B-Instruct-v0.1,japanese,call,,,,,,,,,
12
+ Mixtral-8x7B-Instruct-v0.1,japanese,json,7.938035423738243,553.5285714285715,63.378571428571426,2.248940739450926,1.0,109.0,0.023964353726961752,0.00020885467529296875,76.45081758499146
13
+ Mixtral-8x7B-Instruct-v0.1,japanese,markdown,9.979603266716003,431.71666666666664,5.983333333333333,1.0810483702683527,1.0,12.0,0.017558807731893653,0.0002148151397705078,2.994176149368286
14
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,call,,,,,,,,,
15
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,json,1.9458302193674548,366.25,61.58965517241379,4.169774654522613,1.0,13.0,0.012296600931852907,0.00024318695068359375,0.17363858222961426
16
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,markdown,1.6830505162477494,282.55,47.1125,3.9572829131652663,1.0,14.0,0.012217252319600401,0.0003170967102050781,0.15227961540222168
17
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,japanese,call,,,,,,,,,
18
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,japanese,json,1.4167885013989039,72.81428571428572,8.8,2.0274463007159906,1.0,13.0,0.014790566363975749,0.00031280517578125,0.3310587406158447
19
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,japanese,markdown,1.336316986878713,89.78333333333333,12.716666666666667,2.432054176072235,1.0,13.0,0.013910464400900675,0.0005300045013427734,0.176621675491333
20
+ chat-bison,english,call,,,,,,,,,
21
+ chat-bison,english,json,3.446989095211029,550.05,86.0,89.4390243902439,1.0,138.0,0.4258628240445765,0.0006544589996337891,2.2015340328216553
22
+ chat-bison,japanese,call,,,,,,,,,
23
+ chat-bison,japanese,json,4.333498167991638,246.1,12.0,33.48299319727891,3.0,124.0,0.47770044917152044,0.0005426406860351562,3.5425846576690674
24
+ chat-bison (PaLM 2),english,call,,,,,,,,,
25
+ chat-bison (PaLM 2),english,json,2.5406186148524283,381.7267857142857,60.88125,78.31727422604872,1.0,142.0,0.3495202942369709,0.0003688335418701172,7.334931373596191
26
+ chat-bison (PaLM 2),english,markdown,2.9635989278554917,490.4875,78.5375,84.20386266094421,1.0,138.0,0.3641034907025841,0.0004639625549316406,4.600815534591675
27
+ chat-bison (PaLM 2),japanese,call,,,,,,,,,
28
+ chat-bison (PaLM 2),japanese,json,3.0616454005241396,232.68,10.48,34.21764705882353,3.0,124.0,0.326771635167739,0.0005857944488525391,2.7724690437316895
29
+ chat-bison (PaLM 2),japanese,markdown,4.669546687602997,431.725,13.85,31.74448529411765,2.0,124.0,0.27883222348549785,0.0005550384521484375,7.114030122756958
30
+ chat-bison-32k,english,call,,,,,,,,,
31
+ chat-bison-32k,english,json,3.74513863325119,538.4,84.25,88.26229508196721,1.0,134.0,0.47832588094179745,0.0006556510925292969,3.0114917755126953
32
+ chat-bison-32k,japanese,call,,,,,,,,,
33
+ chat-bison-32k,japanese,json,4.5112169027328495,241.45,11.8,35.77037037037037,6.0,124.0,0.5467217816246881,0.0005869865417480469,4.387756824493408
34
+ chat-bison-32k (PaLM 2 32K),english,call,,,,,,,,,
35
+ chat-bison-32k (PaLM 2 32K),english,json,7.142214598400252,335.47232142857143,53.799107142857146,77.18344289235826,1.0,133.0,1.4512595853652734,0.00041985511779785156,101.5493803024292
36
+ chat-bison-32k (PaLM 2 32K),english,markdown,3.44630788564682,429.95,69.35,82.6826923076923,1.0,133.0,0.5048719226167753,0.0005412101745605469,18.035786390304565
37
+ chat-bison-32k (PaLM 2 32K),japanese,call,,,,,,,,,
38
+ chat-bison-32k (PaLM 2 32K),japanese,json,5.072022783756256,272.85,10.35,34.320754716981135,4.0,124.0,0.5336985453119818,0.0005052089691162109,52.47814655303955
39
+ chat-bison-32k (PaLM 2 32K),japanese,markdown,6.1971998631954195,446.45,21.4,32.118705035971225,5.0,124.0,0.3856057263106751,0.0005400180816650391,7.165225505828857
40
+ gemini-pro,english,call,,,,,,,,,
41
+ gemini-pro,english,json,2.7415290858475547,381.48706896551727,60.894827586206894,204.58853444290338,1.0,988.0,1.4202116817663073,0.0004703998565673828,13.73231840133667
42
+ gemini-pro,english,markdown,3.0089986324310303,467.66,77.45,183.39607843137256,12.0,472.0,1.1130499073103362,0.0006177425384521484,4.875006198883057
43
+ gemini-pro,japanese,call,,,,,,,,,
44
+ gemini-pro,japanese,json,4.5300196591070145,233.19285714285715,5.885714285714286,91.1927374301676,4.0,333.0,1.4752027082709627,0.0006062984466552734,8.291066646575928
45
+ gemini-pro,japanese,markdown,6.166934008781727,366.3666666666667,7.883333333333334,90.83471074380165,9.0,266.0,1.3123543331445742,0.0006639957427978516,13.754565954208374
46
+ gpt-3.5-turbo,english,call,2.908525016600803,456.85911016949154,72.26059322033899,,,,,,
47
+ gpt-3.5-turbo,english,json,2.566863525494622,398.56960556844547,65.32366589327147,4.806746320443226,1.0,16.0,0.015585779219764062,0.0005395412445068359,1.4500916004180908
48
+ gpt-3.5-turbo,english,markdown,2.3388922008184285,506.90384615384613,81.99038461538461,5.050584403142365,1.0,16.0,0.01715806382989308,0.0005617141723632812,1.127073049545288
49
+ gpt-3.5-turbo,japanese,call,7.255881716940138,381.2555309734513,6.323008849557522,,,,,,
50
+ gpt-3.5-turbo,japanese,json,5.226112197780009,232.71604938271605,3.493827160493827,1.1291481969569905,1.0,7.0,0.02129129201220198,0.0005452632904052734,13.75982117652893
51
+ gpt-3.5-turbo,japanese,markdown,7.29901300883684,352.93548387096774,5.967741935483871,1.1894977168949772,1.0,15.0,0.021750167313542772,0.0005612373352050781,13.71114993095398
52
+ gpt-4,english,call,9.15708539162022,373.33666666666664,59.528888888888886,,,,,,
53
+ gpt-4,english,json,7.963626848197565,383.3707317073171,61.69512195121951,4.7834568389659005,1.0,16.0,0.08687007305138472,0.000537872314453125,3.531284809112549
54
+ gpt-4,english,markdown,10.02310108244419,428.35,67.825,4.990243192078054,1.0,16.0,0.10377185442257747,0.0005447864532470703,2.087376117706299
55
+ gpt-4,japanese,call,24.259297592319243,213.65813953488373,1.1627906976744187,,,,,,
56
+ gpt-4,japanese,json,22.703774025460252,209.86666666666667,4.133333333333334,1.1685226429101707,1.0,7.0,0.11835955503744466,0.0005507469177246094,3.5608017444610596
57
+ gpt-4,japanese,markdown,31.99519391655922,275.1,2.925,1.1327980234712787,1.0,9.0,0.12606545905407157,0.0005619525909423828,2.9794347286224365
58
+ gpt-4-turbo,english,call,7.319288367695279,372.86,58.532222222222224,,,,,,
59
+ gpt-4-turbo,english,json,6.457074524425879,407.0243902439024,64.18414634146342,4.735998183701559,1.0,17.0,0.06474667943090798,0.0006806850433349609,5.431884765625
60
+ gpt-4-turbo,english,markdown,8.325546002388,462.1125,71.925,4.984360253471754,1.0,16.0,0.07950969425127868,0.0006999969482421875,2.0926766395568848
61
+ gpt-4-turbo,japanese,call,32.67405146055443,372.7860465116279,24.886046511627907,,,,,,
62
+ gpt-4-turbo,japanese,json,19.359180968999862,250.44166666666666,6.183333333333334,1.184261339007763,1.0,8.0,0.08582140138847597,0.0006830692291259766,13.252992153167725
63
+ gpt-4-turbo,japanese,markdown,20.977174520492554,283.55,4.45,1.1460038395473375,1.0,10.0,0.07991695286011809,0.0007085800170898438,2.3845231533050537
64
+ llama-2-70b-chat,english,call,,,,,,,,,
65
+ llama-2-70b-chat,english,json,2.917410132025375,314.4871134020619,48.49828178694158,4.02267032967033,1.0,15.0,0.019103390617685005,0.0001990795135498047,3.8762006759643555
66
+ llama-2-70b-chat,english,markdown,4.99397261045417,795.1176470588235,121.01960784313725,4.177931176591799,1.0,16.0,0.018161741699259625,0.0002124309539794922,0.7439091205596924
67
+ llama-2-70b-chat,japanese,call,,,,,,,,,
68
+ llama-2-70b-chat,japanese,json,5.265992468681889,358.9718309859155,41.36619718309859,2.3362207250561435,1.0,15.0,0.023359512199899433,0.00020837783813476562,0.9314718246459961
69
+ llama-2-70b-chat,japanese,markdown,11.084085723449444,1290.6774193548388,147.82258064516128,2.2644745033674796,1.0,16.0,0.01566780037868879,0.0002117156982421875,76.44498753547668
70
+ zephyr-7b-beta,english,call,,,,,,,,,
71
+ zephyr-7b-beta,english,json,3.94231437737087,365.275,59.88125,4.262252042007002,1.0,14.0,0.03629181767914927,0.0003070831298828125,0.4896988868713379
72
+ zephyr-7b-beta,english,markdown,4.959704548120499,358.9375,58.3625,4.390672782874618,1.0,15.0,0.05067269182351022,0.00040459632873535156,75.15552616119385
73
+ zephyr-7b-beta,japanese,call,,,,,,,,,
74
+ zephyr-7b-beta,japanese,json,2.339889786640803,41.583333333333336,3.6333333333333333,1.1566991191469633,1.0,7.0,0.042134473762636,0.018090486526489258,0.4599947929382324
75
+ zephyr-7b-beta,japanese,markdown,2.3176693956057233,38.1,2.3833333333333333,1.0343891402714933,1.0,4.0,0.041092377011053165,0.02583909034729004,0.4606599807739258
data/2024-02-03 22:42:30.259126_general_plot.csv ADDED
@@ -0,0 +1,428 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ path,plot_object,description,comment,plot_json
2
+ ./html/plots/response_times.html,"Figure({
3
+ 'data': [{'alignmentgroup': 'True',
4
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
5
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
6
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
7
+ 'name': 'Mistral-7B-Instruct-v0.2',
8
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
9
+ 'orientation': 'v',
10
+ 'showlegend': True,
11
+ 'textposition': 'auto',
12
+ 'type': 'bar',
13
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
+ 'xaxis': 'x',
15
+ 'y': array([3.27102681]),
16
+ 'yaxis': 'y'},
17
+ {'alignmentgroup': 'True',
18
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
19
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
20
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
21
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
22
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
23
+ 'orientation': 'v',
24
+ 'showlegend': True,
25
+ 'textposition': 'auto',
26
+ 'type': 'bar',
27
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
+ 'xaxis': 'x',
29
+ 'y': array([4.69058203]),
30
+ 'yaxis': 'y'},
31
+ {'alignmentgroup': 'True',
32
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
33
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
34
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
35
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
36
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
37
+ 'orientation': 'v',
38
+ 'showlegend': True,
39
+ 'textposition': 'auto',
40
+ 'type': 'bar',
41
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
+ 'xaxis': 'x',
43
+ 'y': array([1.79273835]),
44
+ 'yaxis': 'y'},
45
+ {'alignmentgroup': 'True',
46
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
47
+ 'legendgroup': 'chat-bison',
48
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
+ 'name': 'chat-bison',
50
+ 'offsetgroup': 'chat-bison',
51
+ 'orientation': 'v',
52
+ 'showlegend': True,
53
+ 'textposition': 'auto',
54
+ 'type': 'bar',
55
+ 'x': array(['chat-bison'], dtype=object),
56
+ 'xaxis': 'x',
57
+ 'y': array([3.89024363]),
58
+ 'yaxis': 'y'},
59
+ {'alignmentgroup': 'True',
60
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
61
+ 'legendgroup': 'chat-bison (PaLM 2)',
62
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
+ 'name': 'chat-bison (PaLM 2)',
64
+ 'offsetgroup': 'chat-bison (PaLM 2)',
65
+ 'orientation': 'v',
66
+ 'showlegend': True,
67
+ 'textposition': 'auto',
68
+ 'type': 'bar',
69
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
70
+ 'xaxis': 'x',
71
+ 'y': array([2.66830386]),
72
+ 'yaxis': 'y'},
73
+ {'alignmentgroup': 'True',
74
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
75
+ 'legendgroup': 'chat-bison-32k',
76
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
+ 'name': 'chat-bison-32k',
78
+ 'offsetgroup': 'chat-bison-32k',
79
+ 'orientation': 'v',
80
+ 'showlegend': True,
81
+ 'textposition': 'auto',
82
+ 'type': 'bar',
83
+ 'x': array(['chat-bison-32k'], dtype=object),
84
+ 'xaxis': 'x',
85
+ 'y': array([4.12817777]),
86
+ 'yaxis': 'y'},
87
+ {'alignmentgroup': 'True',
88
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
89
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
90
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
92
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
93
+ 'orientation': 'v',
94
+ 'showlegend': True,
95
+ 'textposition': 'auto',
96
+ 'type': 'bar',
97
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
98
+ 'xaxis': 'x',
99
+ 'y': array([6.73886213]),
100
+ 'yaxis': 'y'},
101
+ {'alignmentgroup': 'True',
102
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
103
+ 'legendgroup': 'gemini-pro',
104
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
105
+ 'name': 'gemini-pro',
106
+ 'offsetgroup': 'gemini-pro',
107
+ 'orientation': 'v',
108
+ 'showlegend': True,
109
+ 'textposition': 'auto',
110
+ 'type': 'bar',
111
+ 'x': array(['gemini-pro'], dtype=object),
112
+ 'xaxis': 'x',
113
+ 'y': array([3.03678889]),
114
+ 'yaxis': 'y'},
115
+ {'alignmentgroup': 'True',
116
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
117
+ 'legendgroup': 'gpt-3.5-turbo',
118
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
119
+ 'name': 'gpt-3.5-turbo',
120
+ 'offsetgroup': 'gpt-3.5-turbo',
121
+ 'orientation': 'v',
122
+ 'showlegend': True,
123
+ 'textposition': 'auto',
124
+ 'type': 'bar',
125
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
126
+ 'xaxis': 'x',
127
+ 'y': array([4.29307391]),
128
+ 'yaxis': 'y'},
129
+ {'alignmentgroup': 'True',
130
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
131
+ 'legendgroup': 'gpt-4',
132
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
133
+ 'name': 'gpt-4',
134
+ 'offsetgroup': 'gpt-4',
135
+ 'orientation': 'v',
136
+ 'showlegend': True,
137
+ 'textposition': 'auto',
138
+ 'type': 'bar',
139
+ 'x': array(['gpt-4'], dtype=object),
140
+ 'xaxis': 'x',
141
+ 'y': array([14.32373439]),
142
+ 'yaxis': 'y'},
143
+ {'alignmentgroup': 'True',
144
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
145
+ 'legendgroup': 'gpt-4-turbo',
146
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
147
+ 'name': 'gpt-4-turbo',
148
+ 'offsetgroup': 'gpt-4-turbo',
149
+ 'orientation': 'v',
150
+ 'showlegend': True,
151
+ 'textposition': 'auto',
152
+ 'type': 'bar',
153
+ 'x': array(['gpt-4-turbo'], dtype=object),
154
+ 'xaxis': 'x',
155
+ 'y': array([15.5354884]),
156
+ 'yaxis': 'y'},
157
+ {'alignmentgroup': 'True',
158
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
159
+ 'legendgroup': 'llama-2-70b-chat',
160
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
161
+ 'name': 'llama-2-70b-chat',
162
+ 'offsetgroup': 'llama-2-70b-chat',
163
+ 'orientation': 'v',
164
+ 'showlegend': True,
165
+ 'textposition': 'auto',
166
+ 'type': 'bar',
167
+ 'x': array(['llama-2-70b-chat'], dtype=object),
168
+ 'xaxis': 'x',
169
+ 'y': array([3.6742315]),
170
+ 'yaxis': 'y'},
171
+ {'alignmentgroup': 'True',
172
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
173
+ 'legendgroup': 'zephyr-7b-beta',
174
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
175
+ 'name': 'zephyr-7b-beta',
176
+ 'offsetgroup': 'zephyr-7b-beta',
177
+ 'orientation': 'v',
178
+ 'showlegend': True,
179
+ 'textposition': 'auto',
180
+ 'type': 'bar',
181
+ 'x': array(['zephyr-7b-beta'], dtype=object),
182
+ 'xaxis': 'x',
183
+ 'y': array([3.44499114]),
184
+ 'yaxis': 'y'}],
185
+ 'layout': {'barmode': 'relative',
186
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
187
+ 'template': '...',
188
+ 'title': {'text': 'Model endpoints response times'},
189
+ 'xaxis': {'anchor': 'y',
190
+ 'categoryarray': [Mistral-7B-Instruct-v0.2,
191
+ Mixtral-8x7B-Instruct-v0.1,
192
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
193
+ chat-bison, chat-bison (PaLM 2), chat-
194
+ bison-32k, chat-bison-32k (PaLM 2 32K),
195
+ gemini-pro, gpt-3.5-turbo, gpt-4,
196
+ gpt-4-turbo, llama-2-70b-chat,
197
+ zephyr-7b-beta],
198
+ 'categoryorder': 'array',
199
+ 'domain': [0.0, 1.0],
200
+ 'title': {'text': 'Model'}},
201
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution time (s)'}}}
202
+ })",Model endpoints response times,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[3.271026806036631],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[4.690582027777991],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.7927383464436197],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[3.890243631601334],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[2.668303858522159],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[4.128177767992019],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 32K)""],""xaxis"":""x"",""y"":[6.738862129823485],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[3.036788886637026],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[4.293073908173212],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[14.323734385105828],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[15.535488395149827],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[3.6742314998615178],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[3.4449911407752936],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.222222222222222
2,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""
error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6
E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""lin
ecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison"",""chat-bison (PaLM 2)"",""chat-bison-32k"",""chat-bison-32k (PaLM 2 32K)"",""gemini-pro"",""gpt-3.5-turbo"",""gpt-4"",""gpt-4-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution time (s)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model endpoints response times""},""barmode"":""relative""}}"
203
+ ./html/plots/execution_costs.html,"Figure({
204
+ 'data': [{'alignmentgroup': 'True',
205
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
206
+ 'legendgroup': 'gpt-3.5-turbo',
207
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
208
+ 'name': 'gpt-3.5-turbo',
209
+ 'offsetgroup': 'gpt-3.5-turbo',
210
+ 'orientation': 'v',
211
+ 'showlegend': True,
212
+ 'textposition': 'auto',
213
+ 'type': 'bar',
214
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
215
+ 'xaxis': 'x',
216
+ 'y': array([0.22948]),
217
+ 'yaxis': 'y'},
218
+ {'alignmentgroup': 'True',
219
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
220
+ 'legendgroup': 'gpt-4-turbo',
221
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
222
+ 'name': 'gpt-4-turbo',
223
+ 'offsetgroup': 'gpt-4-turbo',
224
+ 'orientation': 'v',
225
+ 'showlegend': True,
226
+ 'textposition': 'auto',
227
+ 'type': 'bar',
228
+ 'x': array(['gpt-4-turbo'], dtype=object),
229
+ 'xaxis': 'x',
230
+ 'y': array([2.9468]),
231
+ 'yaxis': 'y'},
232
+ {'alignmentgroup': 'True',
233
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
234
+ 'legendgroup': 'gpt-4',
235
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
236
+ 'name': 'gpt-4',
237
+ 'offsetgroup': 'gpt-4',
238
+ 'orientation': 'v',
239
+ 'showlegend': True,
240
+ 'textposition': 'auto',
241
+ 'type': 'bar',
242
+ 'x': array(['gpt-4'], dtype=object),
243
+ 'xaxis': 'x',
244
+ 'y': array([6.342]),
245
+ 'yaxis': 'y'},
246
+ {'alignmentgroup': 'True',
247
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
248
+ 'legendgroup': 'llama-2-70b-chat',
249
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
250
+ 'name': 'llama-2-70b-chat',
251
+ 'offsetgroup': 'llama-2-70b-chat',
252
+ 'orientation': 'v',
253
+ 'showlegend': True,
254
+ 'textposition': 'auto',
255
+ 'type': 'bar',
256
+ 'x': array(['llama-2-70b-chat'], dtype=object),
257
+ 'xaxis': 'x',
258
+ 'y': array([0.02828]),
259
+ 'yaxis': 'y'},
260
+ {'alignmentgroup': 'True',
261
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
262
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
263
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
264
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
265
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
266
+ 'orientation': 'v',
267
+ 'showlegend': True,
268
+ 'textposition': 'auto',
269
+ 'type': 'bar',
270
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
271
+ 'xaxis': 'x',
272
+ 'y': array([0.12708]),
273
+ 'yaxis': 'y'},
274
+ {'alignmentgroup': 'True',
275
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
276
+ 'legendgroup': 'zephyr-7b-beta',
277
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
278
+ 'name': 'zephyr-7b-beta',
279
+ 'offsetgroup': 'zephyr-7b-beta',
280
+ 'orientation': 'v',
281
+ 'showlegend': True,
282
+ 'textposition': 'auto',
283
+ 'type': 'bar',
284
+ 'x': array(['zephyr-7b-beta'], dtype=object),
285
+ 'xaxis': 'x',
286
+ 'y': array([0.04109804]),
287
+ 'yaxis': 'y'},
288
+ {'alignmentgroup': 'True',
289
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
290
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
291
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
292
+ 'name': 'Mistral-7B-Instruct-v0.2',
293
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
294
+ 'orientation': 'v',
295
+ 'showlegend': True,
296
+ 'textposition': 'auto',
297
+ 'type': 'bar',
298
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
299
+ 'xaxis': 'x',
300
+ 'y': array([0.10571385]),
301
+ 'yaxis': 'y'},
302
+ {'alignmentgroup': 'True',
303
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
304
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
305
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
306
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
307
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
308
+ 'orientation': 'v',
309
+ 'showlegend': True,
310
+ 'textposition': 'auto',
311
+ 'type': 'bar',
312
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
313
+ 'xaxis': 'x',
314
+ 'y': array([0.00933233]),
315
+ 'yaxis': 'y'},
316
+ {'alignmentgroup': 'True',
317
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
318
+ 'legendgroup': 'gemini-pro',
319
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
320
+ 'name': 'gemini-pro',
321
+ 'offsetgroup': 'gemini-pro',
322
+ 'orientation': 'v',
323
+ 'showlegend': True,
324
+ 'textposition': 'auto',
325
+ 'type': 'bar',
326
+ 'x': array(['gemini-pro'], dtype=object),
327
+ 'xaxis': 'x',
328
+ 'y': array([0.05789]),
329
+ 'yaxis': 'y'},
330
+ {'alignmentgroup': 'True',
331
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
332
+ 'legendgroup': 'chat-bison (PaLM 2)',
333
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
334
+ 'name': 'chat-bison (PaLM 2)',
335
+ 'offsetgroup': 'chat-bison (PaLM 2)',
336
+ 'orientation': 'v',
337
+ 'showlegend': True,
338
+ 'textposition': 'auto',
339
+ 'type': 'bar',
340
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
341
+ 'xaxis': 'x',
342
+ 'y': array([0.04731]),
343
+ 'yaxis': 'y'},
344
+ {'alignmentgroup': 'True',
345
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
346
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
347
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
348
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
349
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
350
+ 'orientation': 'v',
351
+ 'showlegend': True,
352
+ 'textposition': 'auto',
353
+ 'type': 'bar',
354
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
355
+ 'xaxis': 'x',
356
+ 'y': array([0.04454]),
357
+ 'yaxis': 'y'}],
358
+ 'layout': {'barmode': 'relative',
359
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
360
+ 'template': '...',
361
+ 'title': {'text': 'Costs of execution of 800 test queries per model'},
362
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
363
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}}}
364
+ })",Costs of execution of 800 test queries per model,Note that pause and resume time cost was not included in the cost calculation for the models billed hourly. Also although Gemini-Pro model is free for under 60 queries per minute we calculated the full cost for generating the tokens.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[0.22948],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[2.9467999999999996],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[6.3420000000000005],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[0.02828],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[0.12708],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[0.0410980390045378],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[0.1057138456636005],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[0.009332333167394003],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[0.05789],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[0.04731],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 
32K)""],""xaxis"":""x"",""y"":[0.044539999999999996],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""col
orbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}
}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,
""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""styl
e"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 800 test queries per model""},""barmode"":""relative""}}"
365
+ ./html/plots/model_sizes.html,"Figure({
366
+ 'data': [{'alignmentgroup': 'True',
367
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
368
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
369
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
370
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
371
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
372
+ 'orientation': 'v',
373
+ 'showlegend': True,
374
+ 'textposition': 'auto',
375
+ 'type': 'bar',
376
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
377
+ 'xaxis': 'x',
378
+ 'y': array([56.]),
379
+ 'yaxis': 'y'},
380
+ {'alignmentgroup': 'True',
381
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
382
+ 'legendgroup': 'zephyr-7b-beta',
383
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
384
+ 'name': 'zephyr-7b-beta',
385
+ 'offsetgroup': 'zephyr-7b-beta',
386
+ 'orientation': 'v',
387
+ 'showlegend': True,
388
+ 'textposition': 'auto',
389
+ 'type': 'bar',
390
+ 'x': array(['zephyr-7b-beta'], dtype=object),
391
+ 'xaxis': 'x',
392
+ 'y': array([7.]),
393
+ 'yaxis': 'y'},
394
+ {'alignmentgroup': 'True',
395
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
396
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
397
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
398
+ 'name': 'Mistral-7B-Instruct-v0.2',
399
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
400
+ 'orientation': 'v',
401
+ 'showlegend': True,
402
+ 'textposition': 'auto',
403
+ 'type': 'bar',
404
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
405
+ 'xaxis': 'x',
406
+ 'y': array([7.]),
407
+ 'yaxis': 'y'},
408
+ {'alignmentgroup': 'True',
409
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
410
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
411
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
412
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
413
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
414
+ 'orientation': 'v',
415
+ 'showlegend': True,
416
+ 'textposition': 'auto',
417
+ 'type': 'bar',
418
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
419
+ 'xaxis': 'x',
420
+ 'y': array([1.1]),
421
+ 'yaxis': 'y'}],
422
+ 'layout': {'barmode': 'relative',
423
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
424
+ 'template': '...',
425
+ 'title': {'text': 'Model sizes in billions of parameters'},
426
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
427
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}}}
428
+ })",Model sizes in billions of parameters,Note that some models have undisclosed sizes.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B 
params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.1],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.
2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}
}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary""
:{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true
,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"
data/2024-02-05 12:03:42.452218_general_plot.csv ADDED
@@ -0,0 +1,442 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ path,plot_object,description,comment,plot_json
2
+ ./html/plots/response_times.html,"Figure({
3
+ 'data': [{'alignmentgroup': 'True',
4
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
5
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
6
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
7
+ 'name': 'Mistral-7B-Instruct-v0.2',
8
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
9
+ 'orientation': 'v',
10
+ 'showlegend': True,
11
+ 'textposition': 'auto',
12
+ 'type': 'bar',
13
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
+ 'xaxis': 'x',
15
+ 'y': array([3.27102681]),
16
+ 'yaxis': 'y'},
17
+ {'alignmentgroup': 'True',
18
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
19
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
20
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
21
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
22
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
23
+ 'orientation': 'v',
24
+ 'showlegend': True,
25
+ 'textposition': 'auto',
26
+ 'type': 'bar',
27
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
+ 'xaxis': 'x',
29
+ 'y': array([4.69058203]),
30
+ 'yaxis': 'y'},
31
+ {'alignmentgroup': 'True',
32
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
33
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
34
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
35
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
36
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
37
+ 'orientation': 'v',
38
+ 'showlegend': True,
39
+ 'textposition': 'auto',
40
+ 'type': 'bar',
41
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
+ 'xaxis': 'x',
43
+ 'y': array([1.79273835]),
44
+ 'yaxis': 'y'},
45
+ {'alignmentgroup': 'True',
46
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
47
+ 'legendgroup': 'chat-bison',
48
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
+ 'name': 'chat-bison',
50
+ 'offsetgroup': 'chat-bison',
51
+ 'orientation': 'v',
52
+ 'showlegend': True,
53
+ 'textposition': 'auto',
54
+ 'type': 'bar',
55
+ 'x': array(['chat-bison'], dtype=object),
56
+ 'xaxis': 'x',
57
+ 'y': array([3.89024363]),
58
+ 'yaxis': 'y'},
59
+ {'alignmentgroup': 'True',
60
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
61
+ 'legendgroup': 'chat-bison (PaLM 2)',
62
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
+ 'name': 'chat-bison (PaLM 2)',
64
+ 'offsetgroup': 'chat-bison (PaLM 2)',
65
+ 'orientation': 'v',
66
+ 'showlegend': True,
67
+ 'textposition': 'auto',
68
+ 'type': 'bar',
69
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
70
+ 'xaxis': 'x',
71
+ 'y': array([2.66830386]),
72
+ 'yaxis': 'y'},
73
+ {'alignmentgroup': 'True',
74
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
75
+ 'legendgroup': 'chat-bison-32k',
76
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
+ 'name': 'chat-bison-32k',
78
+ 'offsetgroup': 'chat-bison-32k',
79
+ 'orientation': 'v',
80
+ 'showlegend': True,
81
+ 'textposition': 'auto',
82
+ 'type': 'bar',
83
+ 'x': array(['chat-bison-32k'], dtype=object),
84
+ 'xaxis': 'x',
85
+ 'y': array([4.12817777]),
86
+ 'yaxis': 'y'},
87
+ {'alignmentgroup': 'True',
88
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
89
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
90
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
92
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
93
+ 'orientation': 'v',
94
+ 'showlegend': True,
95
+ 'textposition': 'auto',
96
+ 'type': 'bar',
97
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
98
+ 'xaxis': 'x',
99
+ 'y': array([6.73886213]),
100
+ 'yaxis': 'y'},
101
+ {'alignmentgroup': 'True',
102
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
103
+ 'legendgroup': 'gemini-pro',
104
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
105
+ 'name': 'gemini-pro',
106
+ 'offsetgroup': 'gemini-pro',
107
+ 'orientation': 'v',
108
+ 'showlegend': True,
109
+ 'textposition': 'auto',
110
+ 'type': 'bar',
111
+ 'x': array(['gemini-pro'], dtype=object),
112
+ 'xaxis': 'x',
113
+ 'y': array([3.03678889]),
114
+ 'yaxis': 'y'},
115
+ {'alignmentgroup': 'True',
116
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
117
+ 'legendgroup': 'gpt-3.5-turbo',
118
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
119
+ 'name': 'gpt-3.5-turbo',
120
+ 'offsetgroup': 'gpt-3.5-turbo',
121
+ 'orientation': 'v',
122
+ 'showlegend': True,
123
+ 'textposition': 'auto',
124
+ 'type': 'bar',
125
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
126
+ 'xaxis': 'x',
127
+ 'y': array([4.29307391]),
128
+ 'yaxis': 'y'},
129
+ {'alignmentgroup': 'True',
130
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
131
+ 'legendgroup': 'gpt-4',
132
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
133
+ 'name': 'gpt-4',
134
+ 'offsetgroup': 'gpt-4',
135
+ 'orientation': 'v',
136
+ 'showlegend': True,
137
+ 'textposition': 'auto',
138
+ 'type': 'bar',
139
+ 'x': array(['gpt-4'], dtype=object),
140
+ 'xaxis': 'x',
141
+ 'y': array([14.32373439]),
142
+ 'yaxis': 'y'},
143
+ {'alignmentgroup': 'True',
144
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
145
+ 'legendgroup': 'gpt-4-turbo',
146
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
147
+ 'name': 'gpt-4-turbo',
148
+ 'offsetgroup': 'gpt-4-turbo',
149
+ 'orientation': 'v',
150
+ 'showlegend': True,
151
+ 'textposition': 'auto',
152
+ 'type': 'bar',
153
+ 'x': array(['gpt-4-turbo'], dtype=object),
154
+ 'xaxis': 'x',
155
+ 'y': array([15.5354884]),
156
+ 'yaxis': 'y'},
157
+ {'alignmentgroup': 'True',
158
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
159
+ 'legendgroup': 'llama-2-70b-chat',
160
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
161
+ 'name': 'llama-2-70b-chat',
162
+ 'offsetgroup': 'llama-2-70b-chat',
163
+ 'orientation': 'v',
164
+ 'showlegend': True,
165
+ 'textposition': 'auto',
166
+ 'type': 'bar',
167
+ 'x': array(['llama-2-70b-chat'], dtype=object),
168
+ 'xaxis': 'x',
169
+ 'y': array([3.6742315]),
170
+ 'yaxis': 'y'},
171
+ {'alignmentgroup': 'True',
172
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
173
+ 'legendgroup': 'zephyr-7b-beta',
174
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
175
+ 'name': 'zephyr-7b-beta',
176
+ 'offsetgroup': 'zephyr-7b-beta',
177
+ 'orientation': 'v',
178
+ 'showlegend': True,
179
+ 'textposition': 'auto',
180
+ 'type': 'bar',
181
+ 'x': array(['zephyr-7b-beta'], dtype=object),
182
+ 'xaxis': 'x',
183
+ 'y': array([3.44499114]),
184
+ 'yaxis': 'y'}],
185
+ 'layout': {'barmode': 'relative',
186
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
187
+ 'template': '...',
188
+ 'title': {'text': 'Model endpoints response times'},
189
+ 'xaxis': {'anchor': 'y',
190
+ 'categoryarray': [Mistral-7B-Instruct-v0.2,
191
+ Mixtral-8x7B-Instruct-v0.1,
192
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
193
+ chat-bison, chat-bison (PaLM 2), chat-
194
+ bison-32k, chat-bison-32k (PaLM 2 32K),
195
+ gemini-pro, gpt-3.5-turbo, gpt-4,
196
+ gpt-4-turbo, llama-2-70b-chat,
197
+ zephyr-7b-beta],
198
+ 'categoryorder': 'array',
199
+ 'domain': [0.0, 1.0],
200
+ 'title': {'text': 'Model'}},
201
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution time (s)'}}}
202
+ })",Model endpoints response times,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[3.271026806036631],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[4.690582027777991],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.7927383464436197],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[3.890243631601334],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[2.668303858522159],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[4.128177767992019],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 32K)""],""xaxis"":""x"",""y"":[6.738862129823485],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[3.036788886637026],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[4.293073908173212],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[14.323734385105828],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[15.535488395149827],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[3.6742314998615178],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[3.4449911407752936],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.222222222222222
2,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""
error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6
E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""lin
ecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison"",""chat-bison (PaLM 2)"",""chat-bison-32k"",""chat-bison-32k (PaLM 2 32K)"",""gemini-pro"",""gpt-3.5-turbo"",""gpt-4"",""gpt-4-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution time (s)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model endpoints response times""},""barmode"":""relative""}}"
203
+ ./html/plots/execution_costs.html,"Figure({
204
+ 'data': [{'alignmentgroup': 'True',
205
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
206
+ 'legendgroup': 'gpt-3.5-turbo',
207
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
208
+ 'name': 'gpt-3.5-turbo',
209
+ 'offsetgroup': 'gpt-3.5-turbo',
210
+ 'orientation': 'v',
211
+ 'showlegend': True,
212
+ 'textposition': 'auto',
213
+ 'type': 'bar',
214
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
215
+ 'xaxis': 'x',
216
+ 'y': array([0.041]),
217
+ 'yaxis': 'y'},
218
+ {'alignmentgroup': 'True',
219
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
220
+ 'legendgroup': 'gpt-4-turbo',
221
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
222
+ 'name': 'gpt-4-turbo',
223
+ 'offsetgroup': 'gpt-4-turbo',
224
+ 'orientation': 'v',
225
+ 'showlegend': True,
226
+ 'textposition': 'auto',
227
+ 'type': 'bar',
228
+ 'x': array(['gpt-4-turbo'], dtype=object),
229
+ 'xaxis': 'x',
230
+ 'y': array([0.5018]),
231
+ 'yaxis': 'y'},
232
+ {'alignmentgroup': 'True',
233
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
234
+ 'legendgroup': 'gpt-4',
235
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
236
+ 'name': 'gpt-4',
237
+ 'offsetgroup': 'gpt-4',
238
+ 'orientation': 'v',
239
+ 'showlegend': True,
240
+ 'textposition': 'auto',
241
+ 'type': 'bar',
242
+ 'x': array(['gpt-4'], dtype=object),
243
+ 'xaxis': 'x',
244
+ 'y': array([1.2624]),
245
+ 'yaxis': 'y'},
246
+ {'alignmentgroup': 'True',
247
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
248
+ 'legendgroup': 'llama-2-70b-chat',
249
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
250
+ 'name': 'llama-2-70b-chat',
251
+ 'offsetgroup': 'llama-2-70b-chat',
252
+ 'orientation': 'v',
253
+ 'showlegend': True,
254
+ 'textposition': 'auto',
255
+ 'type': 'bar',
256
+ 'x': array(['llama-2-70b-chat'], dtype=object),
257
+ 'xaxis': 'x',
258
+ 'y': array([0.062568]),
259
+ 'yaxis': 'y'},
260
+ {'alignmentgroup': 'True',
261
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
262
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
263
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
264
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
265
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
266
+ 'orientation': 'v',
267
+ 'showlegend': True,
268
+ 'textposition': 'auto',
269
+ 'type': 'bar',
270
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
271
+ 'xaxis': 'x',
272
+ 'y': array([0.072612]),
273
+ 'yaxis': 'y'},
274
+ {'alignmentgroup': 'True',
275
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
276
+ 'legendgroup': 'zephyr-7b-beta',
277
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
278
+ 'name': 'zephyr-7b-beta',
279
+ 'offsetgroup': 'zephyr-7b-beta',
280
+ 'orientation': 'v',
281
+ 'showlegend': True,
282
+ 'textposition': 'auto',
283
+ 'type': 'bar',
284
+ 'x': array(['zephyr-7b-beta'], dtype=object),
285
+ 'xaxis': 'x',
286
+ 'y': array([0.05180257]),
287
+ 'yaxis': 'y'},
288
+ {'alignmentgroup': 'True',
289
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
290
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
291
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
292
+ 'name': 'Mistral-7B-Instruct-v0.2',
293
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
294
+ 'orientation': 'v',
295
+ 'showlegend': True,
296
+ 'textposition': 'auto',
297
+ 'type': 'bar',
298
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
299
+ 'xaxis': 'x',
300
+ 'y': array([0.05200691]),
301
+ 'yaxis': 'y'},
302
+ {'alignmentgroup': 'True',
303
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
304
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
305
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
306
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
307
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
308
+ 'orientation': 'v',
309
+ 'showlegend': True,
310
+ 'textposition': 'auto',
311
+ 'type': 'bar',
312
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
313
+ 'xaxis': 'x',
314
+ 'y': array([0.01634787]),
315
+ 'yaxis': 'y'},
316
+ {'alignmentgroup': 'True',
317
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
318
+ 'legendgroup': 'gemini-pro',
319
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
320
+ 'name': 'gemini-pro',
321
+ 'offsetgroup': 'gemini-pro',
322
+ 'orientation': 'v',
323
+ 'showlegend': True,
324
+ 'textposition': 'auto',
325
+ 'type': 'bar',
326
+ 'x': array(['gemini-pro'], dtype=object),
327
+ 'xaxis': 'x',
328
+ 'y': array([0.01052]),
329
+ 'yaxis': 'y'},
330
+ {'alignmentgroup': 'True',
331
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
332
+ 'legendgroup': 'chat-bison (PaLM 2)',
333
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
334
+ 'name': 'chat-bison (PaLM 2)',
335
+ 'offsetgroup': 'chat-bison (PaLM 2)',
336
+ 'orientation': 'v',
337
+ 'showlegend': True,
338
+ 'textposition': 'auto',
339
+ 'type': 'bar',
340
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
341
+ 'xaxis': 'x',
342
+ 'y': array([0.01309]),
343
+ 'yaxis': 'y'},
344
+ {'alignmentgroup': 'True',
345
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
346
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
347
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
348
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
349
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
350
+ 'orientation': 'v',
351
+ 'showlegend': True,
352
+ 'textposition': 'auto',
353
+ 'type': 'bar',
354
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
355
+ 'xaxis': 'x',
356
+ 'y': array([0.01304]),
357
+ 'yaxis': 'y'}],
358
+ 'layout': {'barmode': 'relative',
359
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
360
+ 'template': '...',
361
+ 'title': {'text': 'Costs of execution of 800 test queries per model'},
362
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
363
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}}}
364
+ })",Costs of execution of 800 test queries per model,Note that pause and resume time cost was not included in the cost calculation for the models billed hourly. Also although Gemini-Pro model is free for under 60 queries per minute we calculated the full cost for generating the tokens.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[0.041],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[0.5018],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[1.2624],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[0.062568],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[0.07261200000000001],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[0.05180256798532274],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[0.052006909343931415],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost 
($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[0.016347871700922646],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[0.01052],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[0.013090000000000001],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 
32K)""],""xaxis"":""x"",""y"":[0.01304],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""ou
tlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter
mapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],
[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""
}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 800 test queries per model""},""barmode"":""relative""}}"
365
+ ./html/plots/model_sizes.html,"Figure({
366
+ 'data': [{'alignmentgroup': 'True',
367
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
368
+ 'legendgroup': 'llama-2-70b-chat',
369
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
370
+ 'name': 'llama-2-70b-chat',
371
+ 'offsetgroup': 'llama-2-70b-chat',
372
+ 'orientation': 'v',
373
+ 'showlegend': True,
374
+ 'textposition': 'auto',
375
+ 'type': 'bar',
376
+ 'x': array(['llama-2-70b-chat'], dtype=object),
377
+ 'xaxis': 'x',
378
+ 'y': array([70.]),
379
+ 'yaxis': 'y'},
380
+ {'alignmentgroup': 'True',
381
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
382
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
383
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
384
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
385
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
386
+ 'orientation': 'v',
387
+ 'showlegend': True,
388
+ 'textposition': 'auto',
389
+ 'type': 'bar',
390
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
391
+ 'xaxis': 'x',
392
+ 'y': array([56.]),
393
+ 'yaxis': 'y'},
394
+ {'alignmentgroup': 'True',
395
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
396
+ 'legendgroup': 'zephyr-7b-beta',
397
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
398
+ 'name': 'zephyr-7b-beta',
399
+ 'offsetgroup': 'zephyr-7b-beta',
400
+ 'orientation': 'v',
401
+ 'showlegend': True,
402
+ 'textposition': 'auto',
403
+ 'type': 'bar',
404
+ 'x': array(['zephyr-7b-beta'], dtype=object),
405
+ 'xaxis': 'x',
406
+ 'y': array([7.]),
407
+ 'yaxis': 'y'},
408
+ {'alignmentgroup': 'True',
409
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
410
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
411
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
412
+ 'name': 'Mistral-7B-Instruct-v0.2',
413
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
414
+ 'orientation': 'v',
415
+ 'showlegend': True,
416
+ 'textposition': 'auto',
417
+ 'type': 'bar',
418
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
419
+ 'xaxis': 'x',
420
+ 'y': array([7.]),
421
+ 'yaxis': 'y'},
422
+ {'alignmentgroup': 'True',
423
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
424
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
425
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
426
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
427
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
428
+ 'orientation': 'v',
429
+ 'showlegend': True,
430
+ 'textposition': 'auto',
431
+ 'type': 'bar',
432
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
433
+ 'xaxis': 'x',
434
+ 'y': array([1.1]),
435
+ 'yaxis': 'y'}],
436
+ 'layout': {'barmode': 'relative',
437
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
438
+ 'template': '...',
439
+ 'title': {'text': 'Model sizes in billions of parameters'},
440
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
441
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}}}
442
+ })",Model sizes in billions of parameters,Note that some models have undisclosed sizes.,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[70.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B 
params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[7.0],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.1],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewi
dth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""m
arker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""str
ict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":
true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"
data/2024-02-05 12:03:45.281624_model_costs.csv ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,provider,cost_per_token,provider_pricing
2
+ gpt-3.5-turbo,OpenAI,"$1 / 1M input tokens, $2 / 1M output tokens","$1 / 1M input tokens, $2 / 1M output tokens"
3
+ gpt-4-turbo,OpenAI,"$10 / 1M input tokens, $30 / 1M output tokens","$10 / 1M input tokens, $30 / 1M output tokens"
4
+ gpt-4,OpenAI,"$30 / 1M input tokens, $60 / 1M output tokens","$30 / 1M input tokens, $60 / 1M output tokens"
5
+ llama-2-70b-chat,Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
6
+ Mixtral-8x7B-Instruct-v0.1,Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
7
+ zephyr-7b-beta,Hugging Face Inference Endpoint,$0.15 / 1M tokens,$1.3 / hour
8
+ Mistral-7B-Instruct-v0.2,Hugging Face Inference Endpoint,$0.14 / 1M tokens,$1.3 / hour
9
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,Hugging Face Inference Endpoint,$0.068 / 1M tokens,$0.6 / hour
10
+ gemini-pro,Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input characters, $0.5 / 1M output characters (60 queries per minute are free)"
11
+ chat-bison (PaLM 2),Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
12
+ chat-bison-32k (PaLM 2 32K),Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
data/2024-02-05 23:33:22.947120_summary.csv ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,language,template_name,execution_time,characters_count,words_count,chunk_sizes_mean,chunk_sizes_min,chunk_sizes_max,chunk_generation_times_mean,chunk_generation_times_min,chunk_generation_times_max
2
+ Mistral-7B-Instruct-v0.2,english,json,4.278648148264204,342.8,55.15,4.1311870534561415,1.0,15.0,0.040544769239987996,0.00024437904357910156,60.7178213596344
3
+ Mistral-7B-Instruct-v0.2,english,markdown,3.7188014924526214,366.85,57.1375,4.239202657807309,1.0,16.0,0.03371991898375372,0.020945072174072266,0.25538039207458496
4
+ Mistral-7B-Instruct-v0.2,japanese,json,2.413569121701377,52.07857142857143,3.414285714285714,1.2991803278688525,1.0,11.0,0.039267738759305254,0.00047779083251953125,3.370748996734619
5
+ Mistral-7B-Instruct-v0.2,japanese,markdown,2.323612022399902,42.25,1.5833333333333333,1.1069868995633187,1.0,6.0,0.03958142719935121,0.0004932880401611328,0.2205650806427002
6
+ Mixtral-8x7B-Instruct-v0.1,english,json,3.643989532061343,404.10849056603774,62.575471698113205,4.137546333747872,1.0,15.0,0.014243678199270911,0.00020456314086914062,3.4127349853515625
7
+ Mixtral-8x7B-Instruct-v0.1,english,markdown,5.995457515120506,533.9270833333334,85.15625,4.360071452875127,1.0,15.0,0.016480832612607788,0.00021076202392578125,1.7103569507598877
8
+ Mixtral-8x7B-Instruct-v0.1,japanese,json,7.938035423738243,565.6496350364963,64.76642335766424,2.248940739450926,1.0,109.0,0.023964353726961752,0.00020885467529296875,76.45081758499146
9
+ Mixtral-8x7B-Instruct-v0.1,japanese,markdown,9.979603266716003,431.71666666666664,5.983333333333333,1.0810483702683527,1.0,12.0,0.017558807731893653,0.0002148151397705078,2.994176149368286
10
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,json,1.9458302193674548,366.25,61.58965517241379,4.169774654522613,1.0,13.0,0.012296600931852907,0.00024318695068359375,0.17363858222961426
11
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,markdown,1.6830505162477494,282.55,47.1125,3.9572829131652663,1.0,14.0,0.012217252319600401,0.0003170967102050781,0.15227961540222168
12
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,japanese,json,1.4167885013989039,72.81428571428572,8.8,2.0274463007159906,1.0,13.0,0.014790566363975749,0.00031280517578125,0.3310587406158447
13
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,japanese,markdown,1.336316986878713,89.78333333333333,12.716666666666667,2.432054176072235,1.0,13.0,0.013910464400900675,0.0005300045013427734,0.176621675491333
14
+ chat-bison,english,json,3.446989095211029,550.05,86.0,89.4390243902439,1.0,138.0,0.4258628240445765,0.0006544589996337891,2.2015340328216553
15
+ chat-bison,japanese,json,4.333498167991638,246.1,12.0,33.48299319727891,3.0,124.0,0.47770044917152044,0.0005426406860351562,3.5425846576690674
16
+ chat-bison (PaLM 2),english,json,2.5406186148524283,381.7267857142857,60.88125,78.31727422604872,1.0,142.0,0.3495202942369709,0.0003688335418701172,7.334931373596191
17
+ chat-bison (PaLM 2),english,markdown,2.9635989278554917,490.4875,78.5375,84.20386266094421,1.0,138.0,0.3641034907025841,0.0004639625549316406,4.600815534591675
18
+ chat-bison (PaLM 2),japanese,json,3.0616454005241396,232.68,10.48,34.21764705882353,3.0,124.0,0.326771635167739,0.0005857944488525391,2.7724690437316895
19
+ chat-bison (PaLM 2),japanese,markdown,4.669546687602997,431.725,13.85,31.74448529411765,2.0,124.0,0.27883222348549785,0.0005550384521484375,7.114030122756958
20
+ chat-bison-32k,english,json,3.74513863325119,538.4,84.25,88.26229508196721,1.0,134.0,0.47832588094179745,0.0006556510925292969,3.0114917755126953
21
+ chat-bison-32k,japanese,json,4.5112169027328495,241.45,11.8,35.77037037037037,6.0,124.0,0.5467217816246881,0.0005869865417480469,4.387756824493408
22
+ chat-bison-32k (PaLM 2 32K),english,json,7.142214598400252,335.47232142857143,53.799107142857146,77.18344289235826,1.0,133.0,1.4512595853652734,0.00041985511779785156,101.5493803024292
23
+ chat-bison-32k (PaLM 2 32K),english,markdown,3.44630788564682,429.95,69.35,82.6826923076923,1.0,133.0,0.5048719226167753,0.0005412101745605469,18.035786390304565
24
+ chat-bison-32k (PaLM 2 32K),japanese,json,5.072022783756256,272.85,10.35,34.320754716981135,4.0,124.0,0.5336985453119818,0.0005052089691162109,52.47814655303955
25
+ chat-bison-32k (PaLM 2 32K),japanese,markdown,6.1971998631954195,446.45,21.4,32.118705035971225,5.0,124.0,0.3856057263106751,0.0005400180816650391,7.165225505828857
26
+ gemini-pro,english,json,2.7415290858475547,388.5206321334504,62.01755926251097,204.58853444290338,1.0,988.0,1.4202116817663073,0.0004703998565673828,13.73231840133667
27
+ gemini-pro,english,markdown,3.0089986324310303,487.1458333333333,80.67708333333333,183.39607843137256,12.0,472.0,1.1130499073103362,0.0006177425384521484,4.875006198883057
28
+ gemini-pro,japanese,json,4.5300196591070145,276.6694915254237,6.983050847457627,91.1927374301676,4.0,333.0,1.4752027082709627,0.0006062984466552734,8.291066646575928
29
+ gemini-pro,japanese,markdown,6.166934008781727,422.7307692307692,9.096153846153847,90.83471074380165,9.0,266.0,1.3123543331445742,0.0006639957427978516,13.754565954208374
30
+ gpt-3.5-turbo,english,call,2.908525016600803,456.85911016949154,72.26059322033899,,,,,,
31
+ gpt-3.5-turbo,english,json,2.566863525494622,398.56960556844547,65.32366589327147,4.806746320443226,1.0,16.0,0.015585779219764062,0.0005395412445068359,1.4500916004180908
32
+ gpt-3.5-turbo,english,markdown,2.3388922008184285,506.90384615384613,81.99038461538461,5.050584403142365,1.0,16.0,0.01715806382989308,0.0005617141723632812,1.127073049545288
33
+ gpt-3.5-turbo,japanese,call,7.255881716940138,382.95,6.351111111111111,,,,,,
34
+ gpt-3.5-turbo,japanese,json,5.226112197780009,237.1069182389937,3.559748427672956,1.1291481969569905,1.0,7.0,0.02129129201220198,0.0005452632904052734,13.75982117652893
35
+ gpt-3.5-turbo,japanese,markdown,7.29901300883684,358.72131147540983,6.065573770491803,1.1894977168949772,1.0,15.0,0.021750167313542772,0.0005612373352050781,13.71114993095398
36
+ gpt-4,english,call,9.15708539162022,374.16815144766144,59.661469933184854,,,,,,
37
+ gpt-4,english,json,7.963626848197565,383.3707317073171,61.69512195121951,4.7834568389659005,1.0,16.0,0.08687007305138472,0.000537872314453125,3.531284809112549
38
+ gpt-4,english,markdown,10.02310108244419,428.35,67.825,4.990243192078054,1.0,16.0,0.10377185442257747,0.0005447864532470703,2.087376117706299
39
+ gpt-4,japanese,call,24.259297592319243,214.9076023391813,1.1695906432748537,,,,,,
40
+ gpt-4,japanese,json,22.703774025460252,211.63025210084032,4.168067226890757,1.1685226429101707,1.0,7.0,0.11835955503744466,0.0005507469177246094,3.5608017444610596
41
+ gpt-4,japanese,markdown,31.99519391655922,275.1,2.925,1.1327980234712787,1.0,9.0,0.12606545905407157,0.0005619525909423828,2.9794347286224365
42
+ gpt-4-turbo,english,call,7.319288367695279,372.86,58.532222222222224,,,,,,
43
+ gpt-4-turbo,english,json,6.457074524425879,407.0243902439024,64.18414634146342,4.735998183701559,1.0,17.0,0.06474667943090798,0.0006806850433349609,5.431884765625
44
+ gpt-4-turbo,english,markdown,8.325546002388,462.1125,71.925,4.984360253471754,1.0,16.0,0.07950969425127868,0.0006999969482421875,2.0926766395568848
45
+ gpt-4-turbo,japanese,call,32.67405146055443,372.7860465116279,24.886046511627907,,,,,,
46
+ gpt-4-turbo,japanese,json,19.359180968999862,250.44166666666666,6.183333333333334,1.184261339007763,1.0,8.0,0.08582140138847597,0.0006830692291259766,13.252992153167725
47
+ gpt-4-turbo,japanese,markdown,20.977174520492554,283.55,4.45,1.1460038395473375,1.0,10.0,0.07991695286011809,0.0007085800170898438,2.3845231533050537
48
+ llama-2-70b-chat,english,json,2.917410132025375,355.7463556851312,54.861030126336246,4.02267032967033,1.0,15.0,0.019103390617685005,0.0001990795135498047,3.8762006759643555
49
+ llama-2-70b-chat,english,markdown,4.99397261045417,827.5714285714286,125.95918367346938,4.177931176591799,1.0,16.0,0.018161741699259625,0.0002124309539794922,0.7439091205596924
50
+ llama-2-70b-chat,japanese,json,5.265992468681889,369.3768115942029,42.56521739130435,2.3362207250561435,1.0,15.0,0.023359512199899433,0.00020837783813476562,0.9314718246459961
51
+ llama-2-70b-chat,japanese,markdown,11.084085723449444,1379.6896551724137,158.01724137931035,2.2644745033674796,1.0,16.0,0.01566780037868879,0.0002117156982421875,76.44498753547668
52
+ zephyr-7b-beta,english,json,3.94231437737087,367.57232704402514,60.257861635220124,4.262252042007002,1.0,14.0,0.03629181767914927,0.0003070831298828125,0.4896988868713379
53
+ zephyr-7b-beta,english,markdown,4.959704548120499,358.9375,58.3625,4.390672782874618,1.0,15.0,0.05067269182351022,0.00040459632873535156,75.15552616119385
54
+ zephyr-7b-beta,japanese,json,2.339889786640803,41.583333333333336,3.6333333333333333,1.1566991191469633,1.0,7.0,0.042134473762636,0.018090486526489258,0.4599947929382324
55
+ zephyr-7b-beta,japanese,markdown,2.3176693956057233,38.1,2.3833333333333333,1.0343891402714933,1.0,4.0,0.041092377011053165,0.02583909034729004,0.4606599807739258
data/2024-02-06 07:53:19.636658_time_of_day_comparison.csv ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,time_of_day,execution_time,characters_count,words_count
2
+ Mistral-7B-Instruct-v0.2,0-2 midnight,1.9149879813194275,37.8,2.95
3
+ Mistral-7B-Instruct-v0.2,12-14 afternoon,3.228973722457886,222.0625,32.25
4
+ Mistral-7B-Instruct-v0.2,15-17 late afternoon,3.2048643112182615,219.8625,31.8
5
+ Mistral-7B-Instruct-v0.2,18-20 evening,3.397640073299408,261.18333333333334,40.1
6
+ Mistral-7B-Instruct-v0.2,21-23 late evening,3.389284573495388,175.79375,25.68125
7
+ Mistral-7B-Instruct-v0.2,3-5 night,,,
8
+ Mistral-7B-Instruct-v0.2,6-8 early morning,,,
9
+ Mistral-7B-Instruct-v0.2,9-11 morning,3.734026002883911,362.9,58.35
10
+ Mixtral-8x7B-Instruct-v0.1,0-2 midnight,4.639010797279158,323.0394736842105,42.69210526315789
11
+ Mixtral-8x7B-Instruct-v0.1,12-14 afternoon,5.362903979589355,369.3192307692308,54.353846153846156
12
+ Mixtral-8x7B-Instruct-v0.1,15-17 late afternoon,5.80184749175942,347.9681818181818,47.27272727272727
13
+ Mixtral-8x7B-Instruct-v0.1,18-20 evening,3.6435119574237023,326.69,48.545
14
+ Mixtral-8x7B-Instruct-v0.1,21-23 late evening,5.62397656769588,395.15714285714284,49.02857142857143
15
+ Mixtral-8x7B-Instruct-v0.1,3-5 night,4.009439338194697,301.24545454545455,42.21818181818182
16
+ Mixtral-8x7B-Instruct-v0.1,6-8 early morning,4.526968242530536,285.045,41.86
17
+ Mixtral-8x7B-Instruct-v0.1,9-11 morning,3.9661054956285575,304.82,47.28
18
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,0-2 midnight,1.6341248273849487,210.2,34.2
19
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,12-14 afternoon,1.8381905496120452,308.795,51.08
20
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,15-17 late afternoon,1.7547113946505954,285.17857142857144,46.9
21
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,18-20 evening,1.7984187936782836,313.99,51.96
22
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,21-23 late evening,1.5875422928068372,192.78333333333333,31.261111111111113
23
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,3-5 night,2.0128010153770446,372.05,62.6
24
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,6-8 early morning,2.0273348593711855,372.13,62.53
25
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,9-11 morning,1.9041210174560548,372.05,62.6
26
+ chat-bison,0-2 midnight,3.890243631601334,398.075,49.0
27
+ chat-bison (PaLM 2),0-2 midnight,2.468383938074112,381.95,60.9
28
+ chat-bison (PaLM 2),12-14 afternoon,2.6460144804074215,376.28076923076924,55.965384615384615
29
+ chat-bison (PaLM 2),15-17 late afternoon,3.0387172081253744,381.1363636363636,53.35454545454545
30
+ chat-bison (PaLM 2),18-20 evening,2.688272579908371,367.07,55.89
31
+ chat-bison (PaLM 2),21-23 late evening,2.7250528037548065,382.725,52.95
32
+ chat-bison (PaLM 2),3-5 night,2.460119960308075,381.92,60.94
33
+ chat-bison (PaLM 2),6-8 early morning,2.4665334616388592,381.9214285714286,60.892857142857146
34
+ chat-bison (PaLM 2),9-11 morning,2.488477897644043,381.73,60.88
35
+ chat-bison-32k,0-2 midnight,4.128177767992019,389.925,48.025
36
+ chat-bison-32k (PaLM 2 32K),0-2 midnight,7.7498266498247785,335.75,53.85
37
+ chat-bison-32k (PaLM 2 32K),12-14 afternoon,5.014458654477046,339.3692307692308,49.323076923076925
38
+ chat-bison-32k (PaLM 2 32K),15-17 late afternoon,4.5047362284226855,348.65909090909093,48.35454545454545
39
+ chat-bison-32k (PaLM 2 32K),18-20 evening,7.7332194912433625,329.46,49.5
40
+ chat-bison-32k (PaLM 2 32K),21-23 late evening,7.796841062307358,349.95,47.805
41
+ chat-bison-32k (PaLM 2 32K),3-5 night,6.491292915344238,335.75,53.85
42
+ chat-bison-32k (PaLM 2 32K),6-8 early morning,9.141417106560299,335.75,53.85
43
+ chat-bison-32k (PaLM 2 32K),9-11 morning,7.7035503840446475,335.75,53.85
44
+ gemini-pro,0-2 midnight,3.338477972348531,369.825,55.9125
45
+ gemini-pro,12-14 afternoon,2.816922114008949,360.62307692307695,53.25769230769231
46
+ gemini-pro,15-17 late afternoon,2.9268629640903114,364.57272727272726,50.1
47
+ gemini-pro,18-20 evening,2.86901999375759,366.4,55.045
48
+ gemini-pro,21-23 late evening,3.7189874940246117,390.9142857142857,51.35
49
+ gemini-pro,3-5 night,2.8375814715210272,374.8,60.04
50
+ gemini-pro,6-8 early morning,2.7453590130460435,381.2214285714286,60.964285714285715
51
+ gemini-pro,9-11 morning,2.497767536007628,371.93,59.39
52
+ gpt-3.5-turbo,0-2 midnight,3.822115447632102,426.71923076923076,49.05
53
+ gpt-3.5-turbo,12-14 afternoon,3.9458200880459375,381.4428571428571,43.76190476190476
54
+ gpt-3.5-turbo,15-17 late afternoon,4.384064777692159,396.4357142857143,43.28333333333333
55
+ gpt-3.5-turbo,18-20 evening,3.5153889304115657,385.18095238095236,46.01428571428571
56
+ gpt-3.5-turbo,21-23 late evening,5.110168156187617,422.73510971786834,45.358934169278996
57
+ gpt-3.5-turbo,3-5 night,6.062970260473398,418.6192307692308,44.926923076923075
58
+ gpt-3.5-turbo,6-8 early morning,3.787998208734724,403.74444444444447,47.34444444444444
59
+ gpt-3.5-turbo,9-11 morning,3.126271222697364,389.9888888888889,50.93888888888889
60
+ gpt-4,0-2 midnight,12.3578163115329,334.075,41.35
61
+ gpt-4,12-14 afternoon,16.002364798386893,318.3095238095238,38.77142857142857
62
+ gpt-4,15-17 late afternoon,16.80607506932254,313.3595238095238,37.49285714285714
63
+ gpt-4,18-20 evening,13.841120740345547,318.0809523809524,40.19285714285714
64
+ gpt-4,21-23 late evening,14.298642643005493,314.336,37.012
65
+ gpt-4,3-5 night,12.813134506115546,316.93461538461537,37.93076923076923
66
+ gpt-4,6-8 early morning,14.348626694414351,323.5388888888889,40.544444444444444
67
+ gpt-4,9-11 morning,12.759107512468733,338.18333333333334,46.85
68
+ gpt-4-turbo,0-2 midnight,13.770663784850727,382.7613636363636,47.61818181818182
69
+ gpt-4-turbo,12-14 afternoon,13.997754749229976,351.01190476190476,46.03333333333333
70
+ gpt-4-turbo,15-17 late afternoon,22.320911452883767,381.65714285714284,47.35476190476191
71
+ gpt-4-turbo,18-20 evening,16.550320884159632,382.31666666666666,48.45
72
+ gpt-4-turbo,21-23 late evening,14.592236209392548,413.61,44.8
73
+ gpt-4-turbo,3-5 night,14.254795966698573,352.54615384615386,46.37692307692308
74
+ gpt-4-turbo,6-8 early morning,11.555620827939775,357.65555555555557,47.21666666666667
75
+ gpt-4-turbo,9-11 morning,13.686854598257277,381.8888888888889,55.02777777777778
76
+ llama-2-70b-chat,0-2 midnight,3.249819871626402,346.8875,52.06875
77
+ llama-2-70b-chat,12-14 afternoon,4.234376892130426,375.44615384615383,55.238461538461536
78
+ llama-2-70b-chat,15-17 late afternoon,3.6833307104881365,433.6636363636364,59.445454545454545
79
+ llama-2-70b-chat,18-20 evening,2.9706250462084185,317.245,47.4
80
+ llama-2-70b-chat,21-23 late evening,4.719581684340602,572.1689655172414,79.83103448275862
81
+ llama-2-70b-chat,3-5 night,2.8264514451677147,313.71,48.42
82
+ llama-2-70b-chat,6-8 early morning,2.8660141522424265,289.6642857142857,44.614285714285714
83
+ llama-2-70b-chat,9-11 morning,2.872361832027194,283.35,43.45
84
+ zephyr-7b-beta,0-2 midnight,3.7253047794103624,217.82083333333333,33.67916666666667
85
+ zephyr-7b-beta,12-14 afternoon,3.5789777278900146,277.6,44.016666666666666
86
+ zephyr-7b-beta,15-17 late afternoon,3.4592524923459447,248.59,38.9
87
+ zephyr-7b-beta,18-20 evening,3.5673056403795878,273.3666666666667,43.5
88
+ zephyr-7b-beta,21-23 late evening,3.45343524068594,176.23125,27.21875
89
+ zephyr-7b-beta,3-5 night,3.6954557319482166,216.55833333333334,33.46666666666667
90
+ zephyr-7b-beta,6-8 early morning,3.937663261095683,273.03333333333336,43.45
91
+ zephyr-7b-beta,9-11 morning,4.056525647640228,386.3,63.35
data/2024-02-06 09:35:10.194145_time_of_day_comparison.csv ADDED
@@ -0,0 +1,89 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,time_of_day,execution_time,characters_count,words_count
2
+ Mistral-7B-Instruct-v0.2,afternoon,3.228973722457886,222.0625,32.25
3
+ Mistral-7B-Instruct-v0.2,evening,3.397640073299408,261.18333333333334,40.1
4
+ Mistral-7B-Instruct-v0.2,late afternoon,3.2048643112182615,219.8625,31.8
5
+ Mistral-7B-Instruct-v0.2,late evening,3.389284573495388,175.79375,25.68125
6
+ Mistral-7B-Instruct-v0.2,midnight,1.9149879813194275,37.8,2.95
7
+ Mistral-7B-Instruct-v0.2,morning,3.734026002883911,362.9,58.35
8
+ Mixtral-8x7B-Instruct-v0.1,afternoon,5.362903979589355,369.3192307692308,54.353846153846156
9
+ Mixtral-8x7B-Instruct-v0.1,early morning,4.526968242530536,285.045,41.86
10
+ Mixtral-8x7B-Instruct-v0.1,evening,3.6435119574237023,326.69,48.545
11
+ Mixtral-8x7B-Instruct-v0.1,late afternoon,5.80184749175942,347.9681818181818,47.27272727272727
12
+ Mixtral-8x7B-Instruct-v0.1,late evening,5.62397656769588,395.15714285714284,49.02857142857143
13
+ Mixtral-8x7B-Instruct-v0.1,midnight,4.639010797279158,323.0394736842105,42.69210526315789
14
+ Mixtral-8x7B-Instruct-v0.1,morning,3.9661054956285575,304.82,47.28
15
+ Mixtral-8x7B-Instruct-v0.1,night,4.009439338194697,301.24545454545455,42.21818181818182
16
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,afternoon,1.8381905496120452,308.795,51.08
17
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,early morning,2.0273348593711855,372.13,62.53
18
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,evening,1.7984187936782836,313.99,51.96
19
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,late afternoon,1.7547113946505954,285.17857142857144,46.9
20
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,late evening,1.5875422928068372,192.78333333333333,31.261111111111113
21
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,midnight,1.6341248273849487,210.2,34.2
22
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,morning,1.9041210174560548,372.05,62.6
23
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,night,2.0128010153770446,372.05,62.6
24
+ chat-bison,midnight,3.890243631601334,398.075,49.0
25
+ chat-bison (PaLM 2),afternoon,2.6460144804074215,376.28076923076924,55.965384615384615
26
+ chat-bison (PaLM 2),early morning,2.4665334616388592,381.9214285714286,60.892857142857146
27
+ chat-bison (PaLM 2),evening,2.688272579908371,367.07,55.89
28
+ chat-bison (PaLM 2),late afternoon,3.0387172081253744,381.1363636363636,53.35454545454545
29
+ chat-bison (PaLM 2),late evening,2.7250528037548065,382.725,52.95
30
+ chat-bison (PaLM 2),midnight,2.468383938074112,381.95,60.9
31
+ chat-bison (PaLM 2),morning,2.488477897644043,381.73,60.88
32
+ chat-bison (PaLM 2),night,2.460119960308075,381.92,60.94
33
+ chat-bison-32k,midnight,4.128177767992019,389.925,48.025
34
+ chat-bison-32k (PaLM 2 32K),afternoon,5.014458654477046,339.3692307692308,49.323076923076925
35
+ chat-bison-32k (PaLM 2 32K),early morning,9.141417106560299,335.75,53.85
36
+ chat-bison-32k (PaLM 2 32K),evening,7.7332194912433625,329.46,49.5
37
+ chat-bison-32k (PaLM 2 32K),late afternoon,4.5047362284226855,348.65909090909093,48.35454545454545
38
+ chat-bison-32k (PaLM 2 32K),late evening,7.796841062307358,349.95,47.805
39
+ chat-bison-32k (PaLM 2 32K),midnight,7.7498266498247785,335.75,53.85
40
+ chat-bison-32k (PaLM 2 32K),morning,7.7035503840446475,335.75,53.85
41
+ chat-bison-32k (PaLM 2 32K),night,6.491292915344238,335.75,53.85
42
+ gemini-pro,afternoon,2.816922114008949,360.62307692307695,53.25769230769231
43
+ gemini-pro,early morning,2.7453590130460435,381.2214285714286,60.964285714285715
44
+ gemini-pro,evening,2.86901999375759,366.4,55.045
45
+ gemini-pro,late afternoon,2.9268629640903114,364.57272727272726,50.1
46
+ gemini-pro,late evening,3.7189874940246117,390.9142857142857,51.35
47
+ gemini-pro,midnight,3.338477972348531,369.825,55.9125
48
+ gemini-pro,morning,2.497767536007628,371.93,59.39
49
+ gemini-pro,night,2.8375814715210272,374.8,60.04
50
+ gpt-3.5-turbo,afternoon,3.9458200880459375,381.4428571428571,43.76190476190476
51
+ gpt-3.5-turbo,early morning,3.787998208734724,403.74444444444447,47.34444444444444
52
+ gpt-3.5-turbo,evening,3.5153889304115657,385.18095238095236,46.01428571428571
53
+ gpt-3.5-turbo,late afternoon,4.384064777692159,396.4357142857143,43.28333333333333
54
+ gpt-3.5-turbo,late evening,5.110168156187617,422.73510971786834,45.358934169278996
55
+ gpt-3.5-turbo,midnight,3.822115447632102,426.71923076923076,49.05
56
+ gpt-3.5-turbo,morning,3.126271222697364,389.9888888888889,50.93888888888889
57
+ gpt-3.5-turbo,night,6.062970260473398,418.6192307692308,44.926923076923075
58
+ gpt-4,afternoon,16.002364798386893,318.3095238095238,38.77142857142857
59
+ gpt-4,early morning,14.348626694414351,323.5388888888889,40.544444444444444
60
+ gpt-4,evening,13.841120740345547,318.0809523809524,40.19285714285714
61
+ gpt-4,late afternoon,16.80607506932254,313.3595238095238,37.49285714285714
62
+ gpt-4,late evening,14.298642643005493,314.336,37.012
63
+ gpt-4,midnight,12.3578163115329,334.075,41.35
64
+ gpt-4,morning,12.759107512468733,338.18333333333334,46.85
65
+ gpt-4,night,12.813134506115546,316.93461538461537,37.93076923076923
66
+ gpt-4-turbo,afternoon,13.997754749229976,351.01190476190476,46.03333333333333
67
+ gpt-4-turbo,early morning,11.555620827939775,357.65555555555557,47.21666666666667
68
+ gpt-4-turbo,evening,16.550320884159632,382.31666666666666,48.45
69
+ gpt-4-turbo,late afternoon,22.320911452883767,381.65714285714284,47.35476190476191
70
+ gpt-4-turbo,late evening,14.592236209392548,413.61,44.8
71
+ gpt-4-turbo,midnight,13.770663784850727,382.7613636363636,47.61818181818182
72
+ gpt-4-turbo,morning,13.686854598257277,381.8888888888889,55.02777777777778
73
+ gpt-4-turbo,night,14.254795966698573,352.54615384615386,46.37692307692308
74
+ llama-2-70b-chat,afternoon,4.234376892130426,375.44615384615383,55.238461538461536
75
+ llama-2-70b-chat,early morning,2.8660141522424265,289.6642857142857,44.614285714285714
76
+ llama-2-70b-chat,evening,2.9706250462084185,317.245,47.4
77
+ llama-2-70b-chat,late afternoon,3.6833307104881365,433.6636363636364,59.445454545454545
78
+ llama-2-70b-chat,late evening,4.719581684340602,572.1689655172414,79.83103448275862
79
+ llama-2-70b-chat,midnight,3.249819871626402,346.8875,52.06875
80
+ llama-2-70b-chat,morning,2.872361832027194,283.35,43.45
81
+ llama-2-70b-chat,night,2.8264514451677147,313.71,48.42
82
+ zephyr-7b-beta,afternoon,3.5789777278900146,277.6,44.016666666666666
83
+ zephyr-7b-beta,early morning,3.937663261095683,273.03333333333336,43.45
84
+ zephyr-7b-beta,evening,3.5673056403795878,273.3666666666667,43.5
85
+ zephyr-7b-beta,late afternoon,3.4592524923459447,248.59,38.9
86
+ zephyr-7b-beta,late evening,3.45343524068594,176.23125,27.21875
87
+ zephyr-7b-beta,midnight,3.7253047794103624,217.82083333333333,33.67916666666667
88
+ zephyr-7b-beta,morning,4.056525647640228,386.3,63.35
89
+ zephyr-7b-beta,night,3.6954557319482166,216.55833333333334,33.46666666666667
data/2024-02-06 09:42:04.306128_time_of_day_comparison.csv ADDED
@@ -0,0 +1,89 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,time_of_day,execution_time,characters_count,words_count
2
+ Mistral-7B-Instruct-v0.2,0,1.9149879813194275,37.8,2.95
3
+ Mistral-7B-Instruct-v0.2,3,3.734026002883911,362.9,58.35
4
+ Mistral-7B-Instruct-v0.2,4,3.228973722457886,222.0625,32.25
5
+ Mistral-7B-Instruct-v0.2,5,3.2048643112182615,219.8625,31.8
6
+ Mistral-7B-Instruct-v0.2,6,3.397640073299408,261.18333333333334,40.1
7
+ Mistral-7B-Instruct-v0.2,7,3.389284573495388,175.79375,25.68125
8
+ Mixtral-8x7B-Instruct-v0.1,0,4.639010797279158,323.0394736842105,42.69210526315789
9
+ Mixtral-8x7B-Instruct-v0.1,1,4.009439338194697,301.24545454545455,42.21818181818182
10
+ Mixtral-8x7B-Instruct-v0.1,2,4.526968242530536,285.045,41.86
11
+ Mixtral-8x7B-Instruct-v0.1,3,3.9661054956285575,304.82,47.28
12
+ Mixtral-8x7B-Instruct-v0.1,4,5.362903979589355,369.3192307692308,54.353846153846156
13
+ Mixtral-8x7B-Instruct-v0.1,5,5.80184749175942,347.9681818181818,47.27272727272727
14
+ Mixtral-8x7B-Instruct-v0.1,6,3.6435119574237023,326.69,48.545
15
+ Mixtral-8x7B-Instruct-v0.1,7,5.62397656769588,395.15714285714284,49.02857142857143
16
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,0,1.6341248273849487,210.2,34.2
17
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,1,2.0128010153770446,372.05,62.6
18
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,2,2.0273348593711855,372.13,62.53
19
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,3,1.9041210174560548,372.05,62.6
20
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,4,1.8381905496120452,308.795,51.08
21
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,5,1.7547113946505954,285.17857142857144,46.9
22
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,6,1.7984187936782836,313.99,51.96
23
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,7,1.5875422928068372,192.78333333333333,31.261111111111113
24
+ chat-bison,0,3.890243631601334,398.075,49.0
25
+ chat-bison (PaLM 2),0,2.468383938074112,381.95,60.9
26
+ chat-bison (PaLM 2),1,2.460119960308075,381.92,60.94
27
+ chat-bison (PaLM 2),2,2.4665334616388592,381.9214285714286,60.892857142857146
28
+ chat-bison (PaLM 2),3,2.488477897644043,381.73,60.88
29
+ chat-bison (PaLM 2),4,2.6460144804074215,376.28076923076924,55.965384615384615
30
+ chat-bison (PaLM 2),5,3.0387172081253744,381.1363636363636,53.35454545454545
31
+ chat-bison (PaLM 2),6,2.688272579908371,367.07,55.89
32
+ chat-bison (PaLM 2),7,2.7250528037548065,382.725,52.95
33
+ chat-bison-32k,0,4.128177767992019,389.925,48.025
34
+ chat-bison-32k (PaLM 2 32K),0,7.7498266498247785,335.75,53.85
35
+ chat-bison-32k (PaLM 2 32K),1,6.491292915344238,335.75,53.85
36
+ chat-bison-32k (PaLM 2 32K),2,9.141417106560299,335.75,53.85
37
+ chat-bison-32k (PaLM 2 32K),3,7.7035503840446475,335.75,53.85
38
+ chat-bison-32k (PaLM 2 32K),4,5.014458654477046,339.3692307692308,49.323076923076925
39
+ chat-bison-32k (PaLM 2 32K),5,4.5047362284226855,348.65909090909093,48.35454545454545
40
+ chat-bison-32k (PaLM 2 32K),6,7.7332194912433625,329.46,49.5
41
+ chat-bison-32k (PaLM 2 32K),7,7.796841062307358,349.95,47.805
42
+ gemini-pro,0,3.338477972348531,369.825,55.9125
43
+ gemini-pro,1,2.8375814715210272,374.8,60.04
44
+ gemini-pro,2,2.7453590130460435,381.2214285714286,60.964285714285715
45
+ gemini-pro,3,2.497767536007628,371.93,59.39
46
+ gemini-pro,4,2.816922114008949,360.62307692307695,53.25769230769231
47
+ gemini-pro,5,2.9268629640903114,364.57272727272726,50.1
48
+ gemini-pro,6,2.86901999375759,366.4,55.045
49
+ gemini-pro,7,3.7189874940246117,390.9142857142857,51.35
50
+ gpt-3.5-turbo,0,3.822115447632102,426.71923076923076,49.05
51
+ gpt-3.5-turbo,1,6.062970260473398,418.6192307692308,44.926923076923075
52
+ gpt-3.5-turbo,2,3.787998208734724,403.74444444444447,47.34444444444444
53
+ gpt-3.5-turbo,3,3.126271222697364,389.9888888888889,50.93888888888889
54
+ gpt-3.5-turbo,4,3.9458200880459375,381.4428571428571,43.76190476190476
55
+ gpt-3.5-turbo,5,4.384064777692159,396.4357142857143,43.28333333333333
56
+ gpt-3.5-turbo,6,3.5153889304115657,385.18095238095236,46.01428571428571
57
+ gpt-3.5-turbo,7,5.110168156187617,422.73510971786834,45.358934169278996
58
+ gpt-4,0,12.3578163115329,334.075,41.35
59
+ gpt-4,1,12.813134506115546,316.93461538461537,37.93076923076923
60
+ gpt-4,2,14.348626694414351,323.5388888888889,40.544444444444444
61
+ gpt-4,3,12.759107512468733,338.18333333333334,46.85
62
+ gpt-4,4,16.002364798386893,318.3095238095238,38.77142857142857
63
+ gpt-4,5,16.80607506932254,313.3595238095238,37.49285714285714
64
+ gpt-4,6,13.841120740345547,318.0809523809524,40.19285714285714
65
+ gpt-4,7,14.298642643005493,314.336,37.012
66
+ gpt-4-turbo,0,13.770663784850727,382.7613636363636,47.61818181818182
67
+ gpt-4-turbo,1,14.254795966698573,352.54615384615386,46.37692307692308
68
+ gpt-4-turbo,2,11.555620827939775,357.65555555555557,47.21666666666667
69
+ gpt-4-turbo,3,13.686854598257277,381.8888888888889,55.02777777777778
70
+ gpt-4-turbo,4,13.997754749229976,351.01190476190476,46.03333333333333
71
+ gpt-4-turbo,5,22.320911452883767,381.65714285714284,47.35476190476191
72
+ gpt-4-turbo,6,16.550320884159632,382.31666666666666,48.45
73
+ gpt-4-turbo,7,14.592236209392548,413.61,44.8
74
+ llama-2-70b-chat,0,3.249819871626402,346.8875,52.06875
75
+ llama-2-70b-chat,1,2.8264514451677147,313.71,48.42
76
+ llama-2-70b-chat,2,2.8660141522424265,289.6642857142857,44.614285714285714
77
+ llama-2-70b-chat,3,2.872361832027194,283.35,43.45
78
+ llama-2-70b-chat,4,4.234376892130426,375.44615384615383,55.238461538461536
79
+ llama-2-70b-chat,5,3.6833307104881365,433.6636363636364,59.445454545454545
80
+ llama-2-70b-chat,6,2.9706250462084185,317.245,47.4
81
+ llama-2-70b-chat,7,4.719581684340602,572.1689655172414,79.83103448275862
82
+ zephyr-7b-beta,0,3.7253047794103624,217.82083333333333,33.67916666666667
83
+ zephyr-7b-beta,1,3.6954557319482166,216.55833333333334,33.46666666666667
84
+ zephyr-7b-beta,2,3.937663261095683,273.03333333333336,43.45
85
+ zephyr-7b-beta,3,4.056525647640228,386.3,63.35
86
+ zephyr-7b-beta,4,3.5789777278900146,277.6,44.016666666666666
87
+ zephyr-7b-beta,5,3.4592524923459447,248.59,38.9
88
+ zephyr-7b-beta,6,3.5673056403795878,273.3666666666667,43.5
89
+ zephyr-7b-beta,7,3.45343524068594,176.23125,27.21875
data/2024-02-06 09:46:18.795794_time_of_day_comparison.csv ADDED
@@ -0,0 +1,89 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,time_of_day,execution_time,characters_count,words_count
2
+ Mistral-7B-Instruct-v0.2,midnight,1.9149879813194275,37.8,2.95
3
+ Mistral-7B-Instruct-v0.2,morning,3.734026002883911,362.9,58.35
4
+ Mistral-7B-Instruct-v0.2,afternoon,3.228973722457886,222.0625,32.25
5
+ Mistral-7B-Instruct-v0.2,late afternoon,3.2048643112182615,219.8625,31.8
6
+ Mistral-7B-Instruct-v0.2,evening,3.397640073299408,261.18333333333334,40.1
7
+ Mistral-7B-Instruct-v0.2,late evening,3.389284573495388,175.79375,25.68125
8
+ Mixtral-8x7B-Instruct-v0.1,midnight,4.639010797279158,323.0394736842105,42.69210526315789
9
+ Mixtral-8x7B-Instruct-v0.1,night,4.009439338194697,301.24545454545455,42.21818181818182
10
+ Mixtral-8x7B-Instruct-v0.1,early morning,4.526968242530536,285.045,41.86
11
+ Mixtral-8x7B-Instruct-v0.1,morning,3.9661054956285575,304.82,47.28
12
+ Mixtral-8x7B-Instruct-v0.1,afternoon,5.362903979589355,369.3192307692308,54.353846153846156
13
+ Mixtral-8x7B-Instruct-v0.1,late afternoon,5.80184749175942,347.9681818181818,47.27272727272727
14
+ Mixtral-8x7B-Instruct-v0.1,evening,3.6435119574237023,326.69,48.545
15
+ Mixtral-8x7B-Instruct-v0.1,late evening,5.62397656769588,395.15714285714284,49.02857142857143
16
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,midnight,1.6341248273849487,210.2,34.2
17
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,night,2.0128010153770446,372.05,62.6
18
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,early morning,2.0273348593711855,372.13,62.53
19
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,morning,1.9041210174560548,372.05,62.6
20
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,afternoon,1.8381905496120452,308.795,51.08
21
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,late afternoon,1.7547113946505954,285.17857142857144,46.9
22
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,evening,1.7984187936782836,313.99,51.96
23
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,late evening,1.5875422928068372,192.78333333333333,31.261111111111113
24
+ chat-bison,midnight,3.890243631601334,398.075,49.0
25
+ chat-bison (PaLM 2),midnight,2.468383938074112,381.95,60.9
26
+ chat-bison (PaLM 2),night,2.460119960308075,381.92,60.94
27
+ chat-bison (PaLM 2),early morning,2.4665334616388592,381.9214285714286,60.892857142857146
28
+ chat-bison (PaLM 2),morning,2.488477897644043,381.73,60.88
29
+ chat-bison (PaLM 2),afternoon,2.6460144804074215,376.28076923076924,55.965384615384615
30
+ chat-bison (PaLM 2),late afternoon,3.0387172081253744,381.1363636363636,53.35454545454545
31
+ chat-bison (PaLM 2),evening,2.688272579908371,367.07,55.89
32
+ chat-bison (PaLM 2),late evening,2.7250528037548065,382.725,52.95
33
+ chat-bison-32k,midnight,4.128177767992019,389.925,48.025
34
+ chat-bison-32k (PaLM 2 32K),midnight,7.7498266498247785,335.75,53.85
35
+ chat-bison-32k (PaLM 2 32K),night,6.491292915344238,335.75,53.85
36
+ chat-bison-32k (PaLM 2 32K),early morning,9.141417106560299,335.75,53.85
37
+ chat-bison-32k (PaLM 2 32K),morning,7.7035503840446475,335.75,53.85
38
+ chat-bison-32k (PaLM 2 32K),afternoon,5.014458654477046,339.3692307692308,49.323076923076925
39
+ chat-bison-32k (PaLM 2 32K),late afternoon,4.5047362284226855,348.65909090909093,48.35454545454545
40
+ chat-bison-32k (PaLM 2 32K),evening,7.7332194912433625,329.46,49.5
41
+ chat-bison-32k (PaLM 2 32K),late evening,7.796841062307358,349.95,47.805
42
+ gemini-pro,midnight,3.338477972348531,369.825,55.9125
43
+ gemini-pro,night,2.8375814715210272,374.8,60.04
44
+ gemini-pro,early morning,2.7453590130460435,381.2214285714286,60.964285714285715
45
+ gemini-pro,morning,2.497767536007628,371.93,59.39
46
+ gemini-pro,afternoon,2.816922114008949,360.62307692307695,53.25769230769231
47
+ gemini-pro,late afternoon,2.9268629640903114,364.57272727272726,50.1
48
+ gemini-pro,evening,2.86901999375759,366.4,55.045
49
+ gemini-pro,late evening,3.7189874940246117,390.9142857142857,51.35
50
+ gpt-3.5-turbo,midnight,3.822115447632102,426.71923076923076,49.05
51
+ gpt-3.5-turbo,night,6.062970260473398,418.6192307692308,44.926923076923075
52
+ gpt-3.5-turbo,early morning,3.787998208734724,403.74444444444447,47.34444444444444
53
+ gpt-3.5-turbo,morning,3.126271222697364,389.9888888888889,50.93888888888889
54
+ gpt-3.5-turbo,afternoon,3.9458200880459375,381.4428571428571,43.76190476190476
55
+ gpt-3.5-turbo,late afternoon,4.384064777692159,396.4357142857143,43.28333333333333
56
+ gpt-3.5-turbo,evening,3.5153889304115657,385.18095238095236,46.01428571428571
57
+ gpt-3.5-turbo,late evening,5.110168156187617,422.73510971786834,45.358934169278996
58
+ gpt-4,midnight,12.3578163115329,334.075,41.35
59
+ gpt-4,night,12.813134506115546,316.93461538461537,37.93076923076923
60
+ gpt-4,early morning,14.348626694414351,323.5388888888889,40.544444444444444
61
+ gpt-4,morning,12.759107512468733,338.18333333333334,46.85
62
+ gpt-4,afternoon,16.002364798386893,318.3095238095238,38.77142857142857
63
+ gpt-4,late afternoon,16.80607506932254,313.3595238095238,37.49285714285714
64
+ gpt-4,evening,13.841120740345547,318.0809523809524,40.19285714285714
65
+ gpt-4,late evening,14.298642643005493,314.336,37.012
66
+ gpt-4-turbo,midnight,13.770663784850727,382.7613636363636,47.61818181818182
67
+ gpt-4-turbo,night,14.254795966698573,352.54615384615386,46.37692307692308
68
+ gpt-4-turbo,early morning,11.555620827939775,357.65555555555557,47.21666666666667
69
+ gpt-4-turbo,morning,13.686854598257277,381.8888888888889,55.02777777777778
70
+ gpt-4-turbo,afternoon,13.997754749229976,351.01190476190476,46.03333333333333
71
+ gpt-4-turbo,late afternoon,22.320911452883767,381.65714285714284,47.35476190476191
72
+ gpt-4-turbo,evening,16.550320884159632,382.31666666666666,48.45
73
+ gpt-4-turbo,late evening,14.592236209392548,413.61,44.8
74
+ llama-2-70b-chat,midnight,3.249819871626402,346.8875,52.06875
75
+ llama-2-70b-chat,night,2.8264514451677147,313.71,48.42
76
+ llama-2-70b-chat,early morning,2.8660141522424265,289.6642857142857,44.614285714285714
77
+ llama-2-70b-chat,morning,2.872361832027194,283.35,43.45
78
+ llama-2-70b-chat,afternoon,4.234376892130426,375.44615384615383,55.238461538461536
79
+ llama-2-70b-chat,late afternoon,3.6833307104881365,433.6636363636364,59.445454545454545
80
+ llama-2-70b-chat,evening,2.9706250462084185,317.245,47.4
81
+ llama-2-70b-chat,late evening,4.719581684340602,572.1689655172414,79.83103448275862
82
+ zephyr-7b-beta,midnight,3.7253047794103624,217.82083333333333,33.67916666666667
83
+ zephyr-7b-beta,night,3.6954557319482166,216.55833333333334,33.46666666666667
84
+ zephyr-7b-beta,early morning,3.937663261095683,273.03333333333336,43.45
85
+ zephyr-7b-beta,morning,4.056525647640228,386.3,63.35
86
+ zephyr-7b-beta,afternoon,3.5789777278900146,277.6,44.016666666666666
87
+ zephyr-7b-beta,late afternoon,3.4592524923459447,248.59,38.9
88
+ zephyr-7b-beta,evening,3.5673056403795878,273.3666666666667,43.5
89
+ zephyr-7b-beta,late evening,3.45343524068594,176.23125,27.21875
data/2024-02-06 09:49:19.637072_time_of_day_comparison.csv ADDED
@@ -0,0 +1,89 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ model,time_of_day,execution_time,characters_count,words_count
2
+ Mistral-7B-Instruct-v0.2,morning,3.734026002883911,362.9,58.35
3
+ Mistral-7B-Instruct-v0.2,afternoon,3.228973722457886,222.0625,32.25
4
+ Mistral-7B-Instruct-v0.2,late afternoon,3.2048643112182615,219.8625,31.8
5
+ Mistral-7B-Instruct-v0.2,evening,3.397640073299408,261.18333333333334,40.1
6
+ Mistral-7B-Instruct-v0.2,late evening,3.389284573495388,175.79375,25.68125
7
+ Mistral-7B-Instruct-v0.2,midnight,1.9149879813194275,37.8,2.95
8
+ Mixtral-8x7B-Instruct-v0.1,early morning,4.526968242530536,285.045,41.86
9
+ Mixtral-8x7B-Instruct-v0.1,morning,3.9661054956285575,304.82,47.28
10
+ Mixtral-8x7B-Instruct-v0.1,afternoon,5.362903979589355,369.3192307692308,54.353846153846156
11
+ Mixtral-8x7B-Instruct-v0.1,late afternoon,5.80184749175942,347.9681818181818,47.27272727272727
12
+ Mixtral-8x7B-Instruct-v0.1,evening,3.6435119574237023,326.69,48.545
13
+ Mixtral-8x7B-Instruct-v0.1,late evening,5.62397656769588,395.15714285714284,49.02857142857143
14
+ Mixtral-8x7B-Instruct-v0.1,midnight,4.639010797279158,323.0394736842105,42.69210526315789
15
+ Mixtral-8x7B-Instruct-v0.1,night,4.009439338194697,301.24545454545455,42.21818181818182
16
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,early morning,2.0273348593711855,372.13,62.53
17
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,morning,1.9041210174560548,372.05,62.6
18
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,afternoon,1.8381905496120452,308.795,51.08
19
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,late afternoon,1.7547113946505954,285.17857142857144,46.9
20
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,evening,1.7984187936782836,313.99,51.96
21
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,late evening,1.5875422928068372,192.78333333333333,31.261111111111113
22
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,midnight,1.6341248273849487,210.2,34.2
23
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,night,2.0128010153770446,372.05,62.6
24
+ chat-bison,midnight,3.890243631601334,398.075,49.0
25
+ chat-bison (PaLM 2),early morning,2.4665334616388592,381.9214285714286,60.892857142857146
26
+ chat-bison (PaLM 2),morning,2.488477897644043,381.73,60.88
27
+ chat-bison (PaLM 2),afternoon,2.6460144804074215,376.28076923076924,55.965384615384615
28
+ chat-bison (PaLM 2),late afternoon,3.0387172081253744,381.1363636363636,53.35454545454545
29
+ chat-bison (PaLM 2),evening,2.688272579908371,367.07,55.89
30
+ chat-bison (PaLM 2),late evening,2.7250528037548065,382.725,52.95
31
+ chat-bison (PaLM 2),midnight,2.468383938074112,381.95,60.9
32
+ chat-bison (PaLM 2),night,2.460119960308075,381.92,60.94
33
+ chat-bison-32k,midnight,4.128177767992019,389.925,48.025
34
+ chat-bison-32k (PaLM 2 32K),early morning,9.141417106560299,335.75,53.85
35
+ chat-bison-32k (PaLM 2 32K),morning,7.7035503840446475,335.75,53.85
36
+ chat-bison-32k (PaLM 2 32K),afternoon,5.014458654477046,339.3692307692308,49.323076923076925
37
+ chat-bison-32k (PaLM 2 32K),late afternoon,4.5047362284226855,348.65909090909093,48.35454545454545
38
+ chat-bison-32k (PaLM 2 32K),evening,7.7332194912433625,329.46,49.5
39
+ chat-bison-32k (PaLM 2 32K),late evening,7.796841062307358,349.95,47.805
40
+ chat-bison-32k (PaLM 2 32K),midnight,7.7498266498247785,335.75,53.85
41
+ chat-bison-32k (PaLM 2 32K),night,6.491292915344238,335.75,53.85
42
+ gemini-pro,early morning,2.7453590130460435,381.2214285714286,60.964285714285715
43
+ gemini-pro,morning,2.497767536007628,371.93,59.39
44
+ gemini-pro,afternoon,2.816922114008949,360.62307692307695,53.25769230769231
45
+ gemini-pro,late afternoon,2.9268629640903114,364.57272727272726,50.1
46
+ gemini-pro,evening,2.86901999375759,366.4,55.045
47
+ gemini-pro,late evening,3.7189874940246117,390.9142857142857,51.35
48
+ gemini-pro,midnight,3.338477972348531,369.825,55.9125
49
+ gemini-pro,night,2.8375814715210272,374.8,60.04
50
+ gpt-3.5-turbo,early morning,3.787998208734724,403.74444444444447,47.34444444444444
51
+ gpt-3.5-turbo,morning,3.126271222697364,389.9888888888889,50.93888888888889
52
+ gpt-3.5-turbo,afternoon,3.9458200880459375,381.4428571428571,43.76190476190476
53
+ gpt-3.5-turbo,late afternoon,4.384064777692159,396.4357142857143,43.28333333333333
54
+ gpt-3.5-turbo,evening,3.5153889304115657,385.18095238095236,46.01428571428571
55
+ gpt-3.5-turbo,late evening,5.110168156187617,422.73510971786834,45.358934169278996
56
+ gpt-3.5-turbo,midnight,3.822115447632102,426.71923076923076,49.05
57
+ gpt-3.5-turbo,night,6.062970260473398,418.6192307692308,44.926923076923075
58
+ gpt-4,early morning,14.348626694414351,323.5388888888889,40.544444444444444
59
+ gpt-4,morning,12.759107512468733,338.18333333333334,46.85
60
+ gpt-4,afternoon,16.002364798386893,318.3095238095238,38.77142857142857
61
+ gpt-4,late afternoon,16.80607506932254,313.3595238095238,37.49285714285714
62
+ gpt-4,evening,13.841120740345547,318.0809523809524,40.19285714285714
63
+ gpt-4,late evening,14.298642643005493,314.336,37.012
64
+ gpt-4,midnight,12.3578163115329,334.075,41.35
65
+ gpt-4,night,12.813134506115546,316.93461538461537,37.93076923076923
66
+ gpt-4-turbo,early morning,11.555620827939775,357.65555555555557,47.21666666666667
67
+ gpt-4-turbo,morning,13.686854598257277,381.8888888888889,55.02777777777778
68
+ gpt-4-turbo,afternoon,13.997754749229976,351.01190476190476,46.03333333333333
69
+ gpt-4-turbo,late afternoon,22.320911452883767,381.65714285714284,47.35476190476191
70
+ gpt-4-turbo,evening,16.550320884159632,382.31666666666666,48.45
71
+ gpt-4-turbo,late evening,14.592236209392548,413.61,44.8
72
+ gpt-4-turbo,midnight,13.770663784850727,382.7613636363636,47.61818181818182
73
+ gpt-4-turbo,night,14.254795966698573,352.54615384615386,46.37692307692308
74
+ llama-2-70b-chat,early morning,2.8660141522424265,289.6642857142857,44.614285714285714
75
+ llama-2-70b-chat,morning,2.872361832027194,283.35,43.45
76
+ llama-2-70b-chat,afternoon,4.234376892130426,375.44615384615383,55.238461538461536
77
+ llama-2-70b-chat,late afternoon,3.6833307104881365,433.6636363636364,59.445454545454545
78
+ llama-2-70b-chat,evening,2.9706250462084185,317.245,47.4
79
+ llama-2-70b-chat,late evening,4.719581684340602,572.1689655172414,79.83103448275862
80
+ llama-2-70b-chat,midnight,3.249819871626402,346.8875,52.06875
81
+ llama-2-70b-chat,night,2.8264514451677147,313.71,48.42
82
+ zephyr-7b-beta,early morning,3.937663261095683,273.03333333333336,43.45
83
+ zephyr-7b-beta,morning,4.056525647640228,386.3,63.35
84
+ zephyr-7b-beta,afternoon,3.5789777278900146,277.6,44.016666666666666
85
+ zephyr-7b-beta,late afternoon,3.4592524923459447,248.59,38.9
86
+ zephyr-7b-beta,evening,3.5673056403795878,273.3666666666667,43.5
87
+ zephyr-7b-beta,late evening,3.45343524068594,176.23125,27.21875
88
+ zephyr-7b-beta,midnight,3.7253047794103624,217.82083333333333,33.67916666666667
89
+ zephyr-7b-beta,night,3.6954557319482166,216.55833333333334,33.46666666666667
data/2024-02-06 13:25:55.133644_general_plot.csv ADDED
@@ -0,0 +1,284 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ path,plot_object,header,description,plot_json
2
+ ./html/plots/response_times.html,"Figure({
3
+ 'data': [{'alignmentgroup': 'True',
4
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
5
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
6
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
7
+ 'name': 'Mistral-7B-Instruct-v0.2',
8
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
9
+ 'orientation': 'v',
10
+ 'showlegend': True,
11
+ 'textposition': 'auto',
12
+ 'type': 'bar',
13
+ 'x': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
14
+ 'xaxis': 'x',
15
+ 'y': array([3.27102681]),
16
+ 'yaxis': 'y'},
17
+ {'alignmentgroup': 'True',
18
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
19
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
20
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
21
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
22
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
23
+ 'orientation': 'v',
24
+ 'showlegend': True,
25
+ 'textposition': 'auto',
26
+ 'type': 'bar',
27
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
28
+ 'xaxis': 'x',
29
+ 'y': array([4.83500647]),
30
+ 'yaxis': 'y'},
31
+ {'alignmentgroup': 'True',
32
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
33
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
34
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
35
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
36
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
37
+ 'orientation': 'v',
38
+ 'showlegend': True,
39
+ 'textposition': 'auto',
40
+ 'type': 'bar',
41
+ 'x': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
42
+ 'xaxis': 'x',
43
+ 'y': array([1.79273835]),
44
+ 'yaxis': 'y'},
45
+ {'alignmentgroup': 'True',
46
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
47
+ 'legendgroup': 'chat-bison',
48
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
49
+ 'name': 'chat-bison',
50
+ 'offsetgroup': 'chat-bison',
51
+ 'orientation': 'v',
52
+ 'showlegend': True,
53
+ 'textposition': 'auto',
54
+ 'type': 'bar',
55
+ 'x': array(['chat-bison'], dtype=object),
56
+ 'xaxis': 'x',
57
+ 'y': array([3.89024363]),
58
+ 'yaxis': 'y'},
59
+ {'alignmentgroup': 'True',
60
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
61
+ 'legendgroup': 'chat-bison (PaLM 2)',
62
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
63
+ 'name': 'chat-bison (PaLM 2)',
64
+ 'offsetgroup': 'chat-bison (PaLM 2)',
65
+ 'orientation': 'v',
66
+ 'showlegend': True,
67
+ 'textposition': 'auto',
68
+ 'type': 'bar',
69
+ 'x': array(['chat-bison (PaLM 2)'], dtype=object),
70
+ 'xaxis': 'x',
71
+ 'y': array([2.66830386]),
72
+ 'yaxis': 'y'},
73
+ {'alignmentgroup': 'True',
74
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
75
+ 'legendgroup': 'chat-bison-32k',
76
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
77
+ 'name': 'chat-bison-32k',
78
+ 'offsetgroup': 'chat-bison-32k',
79
+ 'orientation': 'v',
80
+ 'showlegend': True,
81
+ 'textposition': 'auto',
82
+ 'type': 'bar',
83
+ 'x': array(['chat-bison-32k'], dtype=object),
84
+ 'xaxis': 'x',
85
+ 'y': array([4.12817777]),
86
+ 'yaxis': 'y'},
87
+ {'alignmentgroup': 'True',
88
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
89
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
90
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
91
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
92
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
93
+ 'orientation': 'v',
94
+ 'showlegend': True,
95
+ 'textposition': 'auto',
96
+ 'type': 'bar',
97
+ 'x': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
98
+ 'xaxis': 'x',
99
+ 'y': array([6.73886213]),
100
+ 'yaxis': 'y'},
101
+ {'alignmentgroup': 'True',
102
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
103
+ 'legendgroup': 'gemini-pro',
104
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
105
+ 'name': 'gemini-pro',
106
+ 'offsetgroup': 'gemini-pro',
107
+ 'orientation': 'v',
108
+ 'showlegend': True,
109
+ 'textposition': 'auto',
110
+ 'type': 'bar',
111
+ 'x': array(['gemini-pro'], dtype=object),
112
+ 'xaxis': 'x',
113
+ 'y': array([3.03678889]),
114
+ 'yaxis': 'y'},
115
+ {'alignmentgroup': 'True',
116
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
117
+ 'legendgroup': 'gpt-3.5-turbo',
118
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
119
+ 'name': 'gpt-3.5-turbo',
120
+ 'offsetgroup': 'gpt-3.5-turbo',
121
+ 'orientation': 'v',
122
+ 'showlegend': True,
123
+ 'textposition': 'auto',
124
+ 'type': 'bar',
125
+ 'x': array(['gpt-3.5-turbo'], dtype=object),
126
+ 'xaxis': 'x',
127
+ 'y': array([4.29307391]),
128
+ 'yaxis': 'y'},
129
+ {'alignmentgroup': 'True',
130
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
131
+ 'legendgroup': 'gpt-4',
132
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
133
+ 'name': 'gpt-4',
134
+ 'offsetgroup': 'gpt-4',
135
+ 'orientation': 'v',
136
+ 'showlegend': True,
137
+ 'textposition': 'auto',
138
+ 'type': 'bar',
139
+ 'x': array(['gpt-4'], dtype=object),
140
+ 'xaxis': 'x',
141
+ 'y': array([14.32373439]),
142
+ 'yaxis': 'y'},
143
+ {'alignmentgroup': 'True',
144
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
145
+ 'legendgroup': 'gpt-4-turbo',
146
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
147
+ 'name': 'gpt-4-turbo',
148
+ 'offsetgroup': 'gpt-4-turbo',
149
+ 'orientation': 'v',
150
+ 'showlegend': True,
151
+ 'textposition': 'auto',
152
+ 'type': 'bar',
153
+ 'x': array(['gpt-4-turbo'], dtype=object),
154
+ 'xaxis': 'x',
155
+ 'y': array([15.5354884]),
156
+ 'yaxis': 'y'},
157
+ {'alignmentgroup': 'True',
158
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
159
+ 'legendgroup': 'llama-2-70b-chat',
160
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
161
+ 'name': 'llama-2-70b-chat',
162
+ 'offsetgroup': 'llama-2-70b-chat',
163
+ 'orientation': 'v',
164
+ 'showlegend': True,
165
+ 'textposition': 'auto',
166
+ 'type': 'bar',
167
+ 'x': array(['llama-2-70b-chat'], dtype=object),
168
+ 'xaxis': 'x',
169
+ 'y': array([3.6742315]),
170
+ 'yaxis': 'y'},
171
+ {'alignmentgroup': 'True',
172
+ 'hovertemplate': 'Model=%{x}<br>Execution time (s)=%{y}<extra></extra>',
173
+ 'legendgroup': 'zephyr-7b-beta',
174
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
175
+ 'name': 'zephyr-7b-beta',
176
+ 'offsetgroup': 'zephyr-7b-beta',
177
+ 'orientation': 'v',
178
+ 'showlegend': True,
179
+ 'textposition': 'auto',
180
+ 'type': 'bar',
181
+ 'x': array(['zephyr-7b-beta'], dtype=object),
182
+ 'xaxis': 'x',
183
+ 'y': array([3.6370095]),
184
+ 'yaxis': 'y'}],
185
+ 'layout': {'barmode': 'relative',
186
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
187
+ 'template': '...',
188
+ 'title': {'text': 'Model endpoints response times'},
189
+ 'xaxis': {'anchor': 'y',
190
+ 'categoryarray': [Mistral-7B-Instruct-v0.2,
191
+ Mixtral-8x7B-Instruct-v0.1,
192
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
193
+ chat-bison, chat-bison (PaLM 2), chat-
194
+ bison-32k, chat-bison-32k (PaLM 2 32K),
195
+ gemini-pro, gpt-3.5-turbo, gpt-4,
196
+ gpt-4-turbo, llama-2-70b-chat,
197
+ zephyr-7b-beta],
198
+ 'categoryorder': 'array',
199
+ 'domain': [0.0, 1.0],
200
+ 'title': {'text': 'Model'}},
201
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution time (s)'}}}
202
+ })",Model endpoints response times,"This plot shows averaged response time for one query for each model.
203
+
204
+ We used `time.time()` result saved to variable before making the call to API and compared it to `time.time()` result after receiving the results.
205
+
206
+ It is also important to note that wee used litellm python library for all of the models which adds some overhead compared to pure curl calls.","{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mistral-7B-Instruct-v0.2""],""xaxis"":""x"",""y"":[3.271026806036631],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[4.835006467343727],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""xaxis"":""x"",""y"":[1.7927383464436197],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""chat-bison"",""offsetgroup"":""chat-bison"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison""],""xaxis"":""x"",""y"":[3.890243631601334],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison (PaLM 2)""],""xaxis"":""x"",""y"":[2.668303858522159],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k"",""offsetgroup"":""chat-bison-32k"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k""],""xaxis"":""x"",""y"":[4.128177767992019],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""chat-bison-32k (PaLM 2 32K)""],""xaxis"":""x"",""y"":[6.738862129823485],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gemini-pro""],""xaxis"":""x"",""y"":[3.036788886637026],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-3.5-turbo""],""xaxis"":""x"",""y"":[4.293073908173212],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4""],""xaxis"":""x"",""y"":[14.323734385105828],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""gpt-4-turbo""],""xaxis"":""x"",""y"":[15.535488395149827],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time 
(s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""llama-2-70b-chat""],""xaxis"":""x"",""y"":[3.6742314998615178],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution time (s)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[3.6370095004383316],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.222222222222222
2,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""
error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6
E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""lin
ecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Mistral-7B-Instruct-v0.2"",""Mixtral-8x7B-Instruct-v0.1"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison"",""chat-bison (PaLM 2)"",""chat-bison-32k"",""chat-bison-32k (PaLM 2 32K)"",""gemini-pro"",""gpt-3.5-turbo"",""gpt-4"",""gpt-4-turbo"",""llama-2-70b-chat"",""zephyr-7b-beta""]},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution time (s)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model endpoints response times""},""barmode"":""relative""}}"
207
+ ./html/plots/execution_costs.html,"Figure({
208
+ 'data': [{'alignmentgroup': 'True',
209
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
210
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
211
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
212
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
213
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
214
+ 'orientation': 'v',
215
+ 'showlegend': True,
216
+ 'textposition': 'auto',
217
+ 'type': 'bar',
218
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
219
+ 'xaxis': 'x',
220
+ 'y': array([0.072612]),
221
+ 'yaxis': 'y'},
222
+ {'alignmentgroup': 'True',
223
+ 'hovertemplate': 'Model=%{x}<br>Execution cost ($)=%{y}<extra></extra>',
224
+ 'legendgroup': 'zephyr-7b-beta',
225
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
226
+ 'name': 'zephyr-7b-beta',
227
+ 'offsetgroup': 'zephyr-7b-beta',
228
+ 'orientation': 'v',
229
+ 'showlegend': True,
230
+ 'textposition': 'auto',
231
+ 'type': 'bar',
232
+ 'x': array(['zephyr-7b-beta'], dtype=object),
233
+ 'xaxis': 'x',
234
+ 'y': array([0.05180257]),
235
+ 'yaxis': 'y'}],
236
+ 'layout': {'barmode': 'relative',
237
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
238
+ 'template': '...',
239
+ 'title': {'text': 'Costs of execution of 800 test queries per model'},
240
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
241
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}}}
242
+ })",Costs of execution of 800 test queries per model,"Costs of experiments carried out to create this table, 800 test queries per model.
243
+
244
+ Note that pause and resume time cost was not included in the cost calculation for the models billed hourly.
245
+
246
+ Also although Gemini-Pro model is free for under 60 queries per minute we calculated the full cost for generating the tokens.","{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[0.07261200000000001],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eExecution cost ($)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[0.05180256798532274],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.666666666666666
6,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""sca
tter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fil
lmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""ze
rolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 800 test queries per model""},""barmode"":""relative""}}"
247
+ ./html/plots/model_sizes.html,"Figure({
248
+ 'data': [{'alignmentgroup': 'True',
249
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
250
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
251
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
252
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
253
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
254
+ 'orientation': 'v',
255
+ 'showlegend': True,
256
+ 'textposition': 'auto',
257
+ 'type': 'bar',
258
+ 'x': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
259
+ 'xaxis': 'x',
260
+ 'y': array([56]),
261
+ 'yaxis': 'y'},
262
+ {'alignmentgroup': 'True',
263
+ 'hovertemplate': 'Model=%{x}<br>Model size (B params)=%{y}<extra></extra>',
264
+ 'legendgroup': 'zephyr-7b-beta',
265
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
266
+ 'name': 'zephyr-7b-beta',
267
+ 'offsetgroup': 'zephyr-7b-beta',
268
+ 'orientation': 'v',
269
+ 'showlegend': True,
270
+ 'textposition': 'auto',
271
+ 'type': 'bar',
272
+ 'x': array(['zephyr-7b-beta'], dtype=object),
273
+ 'xaxis': 'x',
274
+ 'y': array([7]),
275
+ 'yaxis': 'y'}],
276
+ 'layout': {'barmode': 'relative',
277
+ 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
278
+ 'template': '...',
279
+ 'title': {'text': 'Model sizes in billions of parameters'},
280
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}},
281
+ 'yaxis': {'anchor': 'x', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}}}
282
+ })",Model sizes in billions of parameters,"Model sizes based on release blogs and documentation of their respective developers.
283
+
284
+ Note that models, which sizes were not disclosed publicly were omitted from this comparison.","{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""Mixtral-8x7B-Instruct-v0.1""],""xaxis"":""x"",""y"":[56],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{x}\u003cbr\u003eModel size (B params)=%{y}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""v"",""showlegend"":true,""textposition"":""auto"",""x"":[""zephyr-7b-beta""],""xaxis"":""x"",""y"":[7],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.88888888888
88888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""co
lorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""
barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolo
r"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}"