Spaces:
Running
Running
Commit
·
86c5452
1
Parent(s):
f156119
2024-02-22 14:10:21 Publish script update
Browse files- app.py +12 -12
- data/general_plots.csv +374 -76
- data/model_costs.csv +58 -0
- data/output_plots.csv +0 -0
- data/summary.csv +95 -0
- pipeline/config.py +1 -1
- pipeline/models.py +22 -0
app.py
CHANGED
@@ -57,10 +57,10 @@ output_types_df = pd.DataFrame(
|
|
57 |
{"Output Type": queries_config.query_template.keys(), "Added text": queries_config.query_template.values()}
|
58 |
)
|
59 |
|
60 |
-
summary_df: pd.DataFrame = pd.read_csv("data/
|
61 |
time_of_day_comparison_df = pd.read_csv("data/time_of_day_comparison.csv")
|
62 |
general_plots = pd.read_csv("data/general_plots.csv")
|
63 |
-
model_costs_df = pd.read_csv("data/
|
64 |
time_of_day_plots = pd.read_csv("data/time_of_day_plots.csv")
|
65 |
output_plots = pd.read_csv("data/output_plots.csv")
|
66 |
|
@@ -97,6 +97,13 @@ def collapse_output_method_toggle():
|
|
97 |
button_text = "Un-collapse output method"
|
98 |
return dataframes()[0], button_text
|
99 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
100 |
|
101 |
def dataframes():
|
102 |
global collapse_languages, collapse_output_method, searched_query, summary_df, time_of_day_comparison_df, model_costs_df
|
@@ -117,9 +124,7 @@ def dataframes():
|
|
117 |
searched_model_names = [n for n in searched_model_names if n]
|
118 |
|
119 |
def for_dataframe(df):
|
120 |
-
|
121 |
-
return dataframe_style(df)
|
122 |
-
return dataframe_style(pd.concat(df[df.model.str.lower().str.contains(n)] for n in searched_model_names))
|
123 |
|
124 |
return (
|
125 |
for_dataframe(summary_df_processed),
|
@@ -172,18 +177,13 @@ def filter_plots(searched_query: str):
|
|
172 |
searched_model_names = [n.lower().strip() for n in searched_model_names]
|
173 |
searched_model_names = [n for n in searched_model_names if n]
|
174 |
|
175 |
-
def filter_dataframe(df):
|
176 |
-
if not searched_model_names:
|
177 |
-
return df
|
178 |
-
return pd.concat(df[df.model.str.lower().str.contains(n)] for n in searched_model_names)
|
179 |
-
|
180 |
results = []
|
181 |
for plot_display, plot, row in plots:
|
182 |
visible = True
|
183 |
if "df" in row and pd.notna(row["df"]):
|
184 |
buffer = io.StringIO(row["df"])
|
185 |
df = pd.read_csv(buffer)
|
186 |
-
df = filter_dataframe(df)
|
187 |
plot = px.bar(df, **json.loads(row["arguments"]))
|
188 |
plot.update_layout(autosize=True)
|
189 |
elif "for model" in row["header"] and searched_model_names:
|
@@ -316,4 +316,4 @@ Mainly OpenAI's GPT models and Google's Palm 2.
|
|
316 |
api_name="collapse_output_method_toggle",
|
317 |
)
|
318 |
|
319 |
-
demo.launch(
|
|
|
57 |
{"Output Type": queries_config.query_template.keys(), "Added text": queries_config.query_template.values()}
|
58 |
)
|
59 |
|
60 |
+
summary_df: pd.DataFrame = pd.read_csv("data/summary.csv")
|
61 |
time_of_day_comparison_df = pd.read_csv("data/time_of_day_comparison.csv")
|
62 |
general_plots = pd.read_csv("data/general_plots.csv")
|
63 |
+
model_costs_df = pd.read_csv("data/model_costs.csv")
|
64 |
time_of_day_plots = pd.read_csv("data/time_of_day_plots.csv")
|
65 |
output_plots = pd.read_csv("data/output_plots.csv")
|
66 |
|
|
|
97 |
button_text = "Un-collapse output method"
|
98 |
return dataframes()[0], button_text
|
99 |
|
100 |
+
def filter_dataframe(df, searched_model_names):
|
101 |
+
if not searched_model_names:
|
102 |
+
return df
|
103 |
+
filter_series = df.model == "" # False values
|
104 |
+
for n in searched_model_names:
|
105 |
+
filter_series = filter_series | df.model.str.lower().str.contains(n)
|
106 |
+
return df[filter_series]
|
107 |
|
108 |
def dataframes():
|
109 |
global collapse_languages, collapse_output_method, searched_query, summary_df, time_of_day_comparison_df, model_costs_df
|
|
|
124 |
searched_model_names = [n for n in searched_model_names if n]
|
125 |
|
126 |
def for_dataframe(df):
|
127 |
+
return dataframe_style(filter_dataframe(df, searched_model_names))
|
|
|
|
|
128 |
|
129 |
return (
|
130 |
for_dataframe(summary_df_processed),
|
|
|
177 |
searched_model_names = [n.lower().strip() for n in searched_model_names]
|
178 |
searched_model_names = [n for n in searched_model_names if n]
|
179 |
|
|
|
|
|
|
|
|
|
|
|
180 |
results = []
|
181 |
for plot_display, plot, row in plots:
|
182 |
visible = True
|
183 |
if "df" in row and pd.notna(row["df"]):
|
184 |
buffer = io.StringIO(row["df"])
|
185 |
df = pd.read_csv(buffer)
|
186 |
+
df = filter_dataframe(df, searched_model_names)
|
187 |
plot = px.bar(df, **json.loads(row["arguments"]))
|
188 |
plot.update_layout(autosize=True)
|
189 |
elif "for model" in row["header"] and searched_model_names:
|
|
|
316 |
api_name="collapse_output_method_toggle",
|
317 |
)
|
318 |
|
319 |
+
demo.launch()
|
data/general_plots.csv
CHANGED
@@ -10,7 +10,7 @@ execution_costs,./html/plots/execution_costs.html,"Figure({
|
|
10 |
'showlegend': True,
|
11 |
'textposition': 'auto',
|
12 |
'type': 'bar',
|
13 |
-
'x': array([
|
14 |
'xaxis': 'x',
|
15 |
'y': array(['gpt-4'], dtype=object),
|
16 |
'yaxis': 'y'},
|
@@ -24,7 +24,7 @@ execution_costs,./html/plots/execution_costs.html,"Figure({
|
|
24 |
'showlegend': True,
|
25 |
'textposition': 'auto',
|
26 |
'type': 'bar',
|
27 |
-
'x': array([
|
28 |
'xaxis': 'x',
|
29 |
'y': array(['gpt-4-turbo'], dtype=object),
|
30 |
'yaxis': 'y'},
|
@@ -38,119 +38,338 @@ execution_costs,./html/plots/execution_costs.html,"Figure({
|
|
38 |
'showlegend': True,
|
39 |
'textposition': 'auto',
|
40 |
'type': 'bar',
|
41 |
-
'x': array([0.
|
42 |
'xaxis': 'x',
|
43 |
'y': array(['gpt-3.5-turbo'], dtype=object),
|
44 |
'yaxis': 'y'},
|
45 |
{'alignmentgroup': 'True',
|
46 |
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
47 |
-
'legendgroup': '
|
48 |
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
49 |
'name': 'llama-2-70b-chat',
|
50 |
'offsetgroup': 'llama-2-70b-chat',
|
51 |
'orientation': 'h',
|
52 |
'showlegend': True,
|
53 |
'textposition': 'auto',
|
54 |
'type': 'bar',
|
55 |
-
'x': array([0.
|
56 |
'xaxis': 'x',
|
57 |
'y': array(['llama-2-70b-chat'], dtype=object),
|
58 |
'yaxis': 'y'},
|
59 |
{'alignmentgroup': 'True',
|
60 |
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
61 |
-
'legendgroup': '
|
62 |
-
'marker': {'color': '#
|
63 |
-
'name': '
|
64 |
-
'offsetgroup': '
|
65 |
'orientation': 'h',
|
66 |
'showlegend': True,
|
67 |
'textposition': 'auto',
|
68 |
'type': 'bar',
|
69 |
-
'x': array([0.
|
70 |
'xaxis': 'x',
|
71 |
-
'y': array(['
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
72 |
'yaxis': 'y'},
|
73 |
{'alignmentgroup': 'True',
|
74 |
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
75 |
'legendgroup': 'gemini-pro',
|
76 |
-
'marker': {'color': '#
|
77 |
'name': 'gemini-pro',
|
78 |
'offsetgroup': 'gemini-pro',
|
79 |
'orientation': 'h',
|
80 |
'showlegend': True,
|
81 |
'textposition': 'auto',
|
82 |
'type': 'bar',
|
83 |
-
'x': array([0.
|
84 |
'xaxis': 'x',
|
85 |
'y': array(['gemini-pro'], dtype=object),
|
86 |
'yaxis': 'y'},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
87 |
{'alignmentgroup': 'True',
|
88 |
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
89 |
'legendgroup': 'chat-bison (PaLM 2)',
|
90 |
-
'marker': {'color': '#
|
91 |
'name': 'chat-bison (PaLM 2)',
|
92 |
'offsetgroup': 'chat-bison (PaLM 2)',
|
93 |
'orientation': 'h',
|
94 |
'showlegend': True,
|
95 |
'textposition': 'auto',
|
96 |
'type': 'bar',
|
97 |
-
'x': array([0.
|
98 |
'xaxis': 'x',
|
99 |
'y': array(['chat-bison (PaLM 2)'], dtype=object),
|
100 |
'yaxis': 'y'},
|
101 |
{'alignmentgroup': 'True',
|
102 |
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
103 |
'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
|
104 |
-
'marker': {'color': '#
|
105 |
'name': 'chat-bison-32k (PaLM 2 32K)',
|
106 |
'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
|
107 |
'orientation': 'h',
|
108 |
'showlegend': True,
|
109 |
'textposition': 'auto',
|
110 |
'type': 'bar',
|
111 |
-
'x': array([0.
|
112 |
'xaxis': 'x',
|
113 |
'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
|
114 |
'yaxis': 'y'},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
115 |
{'alignmentgroup': 'True',
|
116 |
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
117 |
'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
|
118 |
-
'marker': {'color': '#
|
119 |
'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
|
120 |
'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
|
121 |
'orientation': 'h',
|
122 |
'showlegend': True,
|
123 |
'textposition': 'auto',
|
124 |
'type': 'bar',
|
125 |
-
'x': array([0.
|
126 |
'xaxis': 'x',
|
127 |
'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
128 |
'yaxis': 'y'}],
|
129 |
'layout': {'barmode': 'relative',
|
130 |
'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
|
131 |
'template': '...',
|
132 |
-
'title': {'text': 'Costs of execution of
|
133 |
'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}},
|
134 |
'yaxis': {'anchor': 'x',
|
135 |
-
'categoryarray': [
|
136 |
-
|
137 |
-
(
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
138 |
Mixtral-8x7B-Instruct-v0.1,
|
139 |
-
|
140 |
-
gpt-4-turbo, gpt-4],
|
141 |
'categoryorder': 'array',
|
142 |
'domain': [0.0, 1.0],
|
143 |
'title': {'text': 'Model'}}}
|
144 |
-
})",Costs of execution of 20 test queries per model,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.1446],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.056],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.00442],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.002808],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost 
($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0020700000000000002],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0011949999999999999],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.001075],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0010249999999999999],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost 
($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0006276866594950359],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""
#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""
ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""
}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbac
kground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)"",""gemini-pro"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat"",""gpt-3.5-turbo"",""gpt-4-turbo"",""gpt-4""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 20 test queries per model""},""barmode"":""relative""}}","{""y"": ""model"", ""x"": ""model_query_costs"", ""color"": ""model"", ""orientation"": ""h"", ""title"": ""Costs of execution of 20 test queries per model"", ""labels"": {""model"": ""Model"", ""model_query_costs"": ""Execution cost ($)""}}",",model_query_costs,model
|
145 |
-
2,
|
146 |
-
1,
|
147 |
-
0,0.
|
148 |
-
|
149 |
-
|
150 |
-
|
151 |
-
|
152 |
-
|
153 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
154 |
"
|
155 |
model_sizes,./html/plots/model_sizes.html,"Figure({
|
156 |
'data': [{'alignmentgroup': 'True',
|
@@ -183,59 +402,59 @@ model_sizes,./html/plots/model_sizes.html,"Figure({
|
|
183 |
'yaxis': 'y'},
|
184 |
{'alignmentgroup': 'True',
|
185 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
186 |
-
'legendgroup': '
|
187 |
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
|
188 |
-
'name': '
|
189 |
-
'offsetgroup': '
|
190 |
'orientation': 'h',
|
191 |
'showlegend': True,
|
192 |
'textposition': 'auto',
|
193 |
'type': 'bar',
|
194 |
-
'x': array([
|
195 |
'xaxis': 'x',
|
196 |
-
'y': array(['
|
197 |
'yaxis': 'y'},
|
198 |
{'alignmentgroup': 'True',
|
199 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
200 |
-
'legendgroup': '
|
201 |
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
|
202 |
-
'name': '
|
203 |
-
'offsetgroup': '
|
204 |
'orientation': 'h',
|
205 |
'showlegend': True,
|
206 |
'textposition': 'auto',
|
207 |
'type': 'bar',
|
208 |
-
'x': array([
|
209 |
'xaxis': 'x',
|
210 |
-
'y': array(['
|
211 |
'yaxis': 'y'},
|
212 |
{'alignmentgroup': 'True',
|
213 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
214 |
-
'legendgroup': '
|
215 |
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
|
216 |
-
'name': '
|
217 |
-
'offsetgroup': '
|
218 |
'orientation': 'h',
|
219 |
'showlegend': True,
|
220 |
'textposition': 'auto',
|
221 |
'type': 'bar',
|
222 |
-
'x': array([
|
223 |
'xaxis': 'x',
|
224 |
-
'y': array(['
|
225 |
'yaxis': 'y'},
|
226 |
{'alignmentgroup': 'True',
|
227 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
228 |
-
'legendgroup': '
|
229 |
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
|
230 |
-
'name': '
|
231 |
-
'offsetgroup': '
|
232 |
'orientation': 'h',
|
233 |
'showlegend': True,
|
234 |
'textposition': 'auto',
|
235 |
'type': 'bar',
|
236 |
-
'x': array([
|
237 |
'xaxis': 'x',
|
238 |
-
'y': array(['
|
239 |
'yaxis': 'y'},
|
240 |
{'alignmentgroup': 'True',
|
241 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
@@ -253,17 +472,17 @@ model_sizes,./html/plots/model_sizes.html,"Figure({
|
|
253 |
'yaxis': 'y'},
|
254 |
{'alignmentgroup': 'True',
|
255 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
256 |
-
'legendgroup': '
|
257 |
'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
|
258 |
-
'name': '
|
259 |
-
'offsetgroup': '
|
260 |
'orientation': 'h',
|
261 |
'showlegend': True,
|
262 |
'textposition': 'auto',
|
263 |
'type': 'bar',
|
264 |
'x': array([7.]),
|
265 |
'xaxis': 'x',
|
266 |
-
'y': array(['
|
267 |
'yaxis': 'y'},
|
268 |
{'alignmentgroup': 'True',
|
269 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
@@ -295,8 +514,50 @@ model_sizes,./html/plots/model_sizes.html,"Figure({
|
|
295 |
'yaxis': 'y'},
|
296 |
{'alignmentgroup': 'True',
|
297 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
298 |
-
'legendgroup': '
|
299 |
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
300 |
'name': 'RedPajama-INCITE Chat (7B)',
|
301 |
'offsetgroup': 'RedPajama-INCITE Chat (7B)',
|
302 |
'orientation': 'h',
|
@@ -307,10 +568,38 @@ model_sizes,./html/plots/model_sizes.html,"Figure({
|
|
307 |
'xaxis': 'x',
|
308 |
'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
|
309 |
'yaxis': 'y'},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
310 |
{'alignmentgroup': 'True',
|
311 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
312 |
'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
|
313 |
-
'marker': {'color': '#
|
314 |
'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
|
315 |
'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
|
316 |
'orientation': 'h',
|
@@ -328,29 +617,38 @@ model_sizes,./html/plots/model_sizes.html,"Figure({
|
|
328 |
'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}},
|
329 |
'yaxis': {'anchor': 'x',
|
330 |
'categoryarray': [TinyLlama/TinyLlama-1.1B-Chat-v1.0,
|
331 |
-
|
332 |
-
Chat (7B),
|
333 |
-
(
|
334 |
-
|
335 |
-
|
336 |
-
|
|
|
|
|
|
|
|
|
337 |
Mixtral-8x7B-Instruct-v0.1,
|
338 |
llama-2-70b-chat],
|
339 |
'categoryorder': 'array',
|
340 |
'domain': [0.0, 1.0],
|
341 |
'title': {'text': 'Model'}}}
|
342 |
-
})",Model sizes in billions of parameters,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[70.0],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[56.0],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[13.0],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[11.0],""xaxis"":""x"",""y"":[""Upstage SOLAR 
Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""LLaMA-2 Chat 
(7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B 
params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[1.1],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.
2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}
}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary""
:{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true
,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""RedPajama-INCITE Chat (7B)"",""Qwen 1.5 Chat (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""LLaMA-2 Chat (7B)"",""Vicuna v1.5 (7B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""Upstage SOLAR Instruct v1 (11B)"",""WizardLM v1.2 (13B)"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}","{""x"": ""model_sizes"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""title"": ""Model sizes in billions of parameters"", ""labels"": {""model"": ""Model"", ""model_sizes"": ""Model size (B params)""}}",",model_sizes,model
|
343 |
0,70.0,llama-2-70b-chat
|
344 |
1,56.0,Mixtral-8x7B-Instruct-v0.1
|
345 |
-
|
346 |
-
|
347 |
-
|
|
|
|
|
348 |
3,7.0,Mistral-7B-Instruct-v0.2
|
349 |
-
|
350 |
-
|
351 |
-
|
352 |
-
|
353 |
-
|
|
|
|
|
|
|
354 |
4,1.1,TinyLlama/TinyLlama-1.1B-Chat-v1.0
|
355 |
"
|
356 |
model_context_lengths,./html/plots/model_context_lengths.html,"Figure({
|
|
|
10 |
'showlegend': True,
|
11 |
'textposition': 'auto',
|
12 |
'type': 'bar',
|
13 |
+
'x': array([17.4942]),
|
14 |
'xaxis': 'x',
|
15 |
'y': array(['gpt-4'], dtype=object),
|
16 |
'yaxis': 'y'},
|
|
|
24 |
'showlegend': True,
|
25 |
'textposition': 'auto',
|
26 |
'type': 'bar',
|
27 |
+
'x': array([8.7136]),
|
28 |
'xaxis': 'x',
|
29 |
'y': array(['gpt-4-turbo'], dtype=object),
|
30 |
'yaxis': 'y'},
|
|
|
38 |
'showlegend': True,
|
39 |
'textposition': 'auto',
|
40 |
'type': 'bar',
|
41 |
+
'x': array([0.74798]),
|
42 |
'xaxis': 'x',
|
43 |
'y': array(['gpt-3.5-turbo'], dtype=object),
|
44 |
'yaxis': 'y'},
|
45 |
{'alignmentgroup': 'True',
|
46 |
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
47 |
+
'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
|
48 |
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
|
49 |
+
'name': 'Mixtral-8x7B-Instruct-v0.1',
|
50 |
+
'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
|
51 |
+
'orientation': 'h',
|
52 |
+
'showlegend': True,
|
53 |
+
'textposition': 'auto',
|
54 |
+
'type': 'bar',
|
55 |
+
'x': array([0.74277]),
|
56 |
+
'xaxis': 'x',
|
57 |
+
'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
|
58 |
+
'yaxis': 'y'},
|
59 |
+
{'alignmentgroup': 'True',
|
60 |
+
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
61 |
+
'legendgroup': 'zephyr-7b-beta',
|
62 |
+
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
|
63 |
+
'name': 'zephyr-7b-beta',
|
64 |
+
'offsetgroup': 'zephyr-7b-beta',
|
65 |
+
'orientation': 'h',
|
66 |
+
'showlegend': True,
|
67 |
+
'textposition': 'auto',
|
68 |
+
'type': 'bar',
|
69 |
+
'x': array([0.67250116]),
|
70 |
+
'xaxis': 'x',
|
71 |
+
'y': array(['zephyr-7b-beta'], dtype=object),
|
72 |
+
'yaxis': 'y'},
|
73 |
+
{'alignmentgroup': 'True',
|
74 |
+
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
75 |
+
'legendgroup': 'llama-2-70b-chat',
|
76 |
+
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
|
77 |
'name': 'llama-2-70b-chat',
|
78 |
'offsetgroup': 'llama-2-70b-chat',
|
79 |
'orientation': 'h',
|
80 |
'showlegend': True,
|
81 |
'textposition': 'auto',
|
82 |
'type': 'bar',
|
83 |
+
'x': array([0.665964]),
|
84 |
'xaxis': 'x',
|
85 |
'y': array(['llama-2-70b-chat'], dtype=object),
|
86 |
'yaxis': 'y'},
|
87 |
{'alignmentgroup': 'True',
|
88 |
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
89 |
+
'legendgroup': '01-ai Yi Chat (34B)',
|
90 |
+
'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
|
91 |
+
'name': '01-ai Yi Chat (34B)',
|
92 |
+
'offsetgroup': '01-ai Yi Chat (34B)',
|
93 |
'orientation': 'h',
|
94 |
'showlegend': True,
|
95 |
'textposition': 'auto',
|
96 |
'type': 'bar',
|
97 |
+
'x': array([0.405168]),
|
98 |
'xaxis': 'x',
|
99 |
+
'y': array(['01-ai Yi Chat (34B)'], dtype=object),
|
100 |
+
'yaxis': 'y'},
|
101 |
+
{'alignmentgroup': 'True',
|
102 |
+
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
103 |
+
'legendgroup': 'Mistral-7B-Instruct-v0.2',
|
104 |
+
'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
|
105 |
+
'name': 'Mistral-7B-Instruct-v0.2',
|
106 |
+
'offsetgroup': 'Mistral-7B-Instruct-v0.2',
|
107 |
+
'orientation': 'h',
|
108 |
+
'showlegend': True,
|
109 |
+
'textposition': 'auto',
|
110 |
+
'type': 'bar',
|
111 |
+
'x': array([0.23022898]),
|
112 |
+
'xaxis': 'x',
|
113 |
+
'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
|
114 |
'yaxis': 'y'},
|
115 |
{'alignmentgroup': 'True',
|
116 |
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
117 |
'legendgroup': 'gemini-pro',
|
118 |
+
'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
|
119 |
'name': 'gemini-pro',
|
120 |
'offsetgroup': 'gemini-pro',
|
121 |
'orientation': 'h',
|
122 |
'showlegend': True,
|
123 |
'textposition': 'auto',
|
124 |
'type': 'bar',
|
125 |
+
'x': array([0.178845]),
|
126 |
'xaxis': 'x',
|
127 |
'y': array(['gemini-pro'], dtype=object),
|
128 |
'yaxis': 'y'},
|
129 |
+
{'alignmentgroup': 'True',
|
130 |
+
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
131 |
+
'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
|
132 |
+
'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
|
133 |
+
'name': 'Snorkel Mistral PairRM DPO (7B)',
|
134 |
+
'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)',
|
135 |
+
'orientation': 'h',
|
136 |
+
'showlegend': True,
|
137 |
+
'textposition': 'auto',
|
138 |
+
'type': 'bar',
|
139 |
+
'x': array([0.15948]),
|
140 |
+
'xaxis': 'x',
|
141 |
+
'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
|
142 |
+
'yaxis': 'y'},
|
143 |
{'alignmentgroup': 'True',
|
144 |
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
145 |
'legendgroup': 'chat-bison (PaLM 2)',
|
146 |
+
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
|
147 |
'name': 'chat-bison (PaLM 2)',
|
148 |
'offsetgroup': 'chat-bison (PaLM 2)',
|
149 |
'orientation': 'h',
|
150 |
'showlegend': True,
|
151 |
'textposition': 'auto',
|
152 |
'type': 'bar',
|
153 |
+
'x': array([0.158515]),
|
154 |
'xaxis': 'x',
|
155 |
'y': array(['chat-bison (PaLM 2)'], dtype=object),
|
156 |
'yaxis': 'y'},
|
157 |
{'alignmentgroup': 'True',
|
158 |
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
159 |
'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
|
160 |
+
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
|
161 |
'name': 'chat-bison-32k (PaLM 2 32K)',
|
162 |
'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
|
163 |
'orientation': 'h',
|
164 |
'showlegend': True,
|
165 |
'textposition': 'auto',
|
166 |
'type': 'bar',
|
167 |
+
'x': array([0.151035]),
|
168 |
'xaxis': 'x',
|
169 |
'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
|
170 |
'yaxis': 'y'},
|
171 |
+
{'alignmentgroup': 'True',
|
172 |
+
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
173 |
+
'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
|
174 |
+
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
|
175 |
+
'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
|
176 |
+
'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
|
177 |
+
'orientation': 'h',
|
178 |
+
'showlegend': True,
|
179 |
+
'textposition': 'auto',
|
180 |
+
'type': 'bar',
|
181 |
+
'x': array([0.148248]),
|
182 |
+
'xaxis': 'x',
|
183 |
+
'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
|
184 |
+
'yaxis': 'y'},
|
185 |
+
{'alignmentgroup': 'True',
|
186 |
+
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
187 |
+
'legendgroup': 'Chronos Hermes (13B)',
|
188 |
+
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
|
189 |
+
'name': 'Chronos Hermes (13B)',
|
190 |
+
'offsetgroup': 'Chronos Hermes (13B)',
|
191 |
+
'orientation': 'h',
|
192 |
+
'showlegend': True,
|
193 |
+
'textposition': 'auto',
|
194 |
+
'type': 'bar',
|
195 |
+
'x': array([0.141156]),
|
196 |
+
'xaxis': 'x',
|
197 |
+
'y': array(['Chronos Hermes (13B)'], dtype=object),
|
198 |
+
'yaxis': 'y'},
|
199 |
+
{'alignmentgroup': 'True',
|
200 |
+
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
201 |
+
'legendgroup': 'WizardLM v1.2 (13B)',
|
202 |
+
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
|
203 |
+
'name': 'WizardLM v1.2 (13B)',
|
204 |
+
'offsetgroup': 'WizardLM v1.2 (13B)',
|
205 |
+
'orientation': 'h',
|
206 |
+
'showlegend': True,
|
207 |
+
'textposition': 'auto',
|
208 |
+
'type': 'bar',
|
209 |
+
'x': array([0.131244]),
|
210 |
+
'xaxis': 'x',
|
211 |
+
'y': array(['WizardLM v1.2 (13B)'], dtype=object),
|
212 |
+
'yaxis': 'y'},
|
213 |
{'alignmentgroup': 'True',
|
214 |
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
215 |
'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
|
216 |
+
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
|
217 |
'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
|
218 |
'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
|
219 |
'orientation': 'h',
|
220 |
'showlegend': True,
|
221 |
'textposition': 'auto',
|
222 |
'type': 'bar',
|
223 |
+
'x': array([0.11099814]),
|
224 |
'xaxis': 'x',
|
225 |
'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
|
226 |
+
'yaxis': 'y'},
|
227 |
+
{'alignmentgroup': 'True',
|
228 |
+
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
229 |
+
'legendgroup': 'LLaMA-2 Chat (7B)',
|
230 |
+
'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
|
231 |
+
'name': 'LLaMA-2 Chat (7B)',
|
232 |
+
'offsetgroup': 'LLaMA-2 Chat (7B)',
|
233 |
+
'orientation': 'h',
|
234 |
+
'showlegend': True,
|
235 |
+
'textposition': 'auto',
|
236 |
+
'type': 'bar',
|
237 |
+
'x': array([0.103212]),
|
238 |
+
'xaxis': 'x',
|
239 |
+
'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
|
240 |
+
'yaxis': 'y'},
|
241 |
+
{'alignmentgroup': 'True',
|
242 |
+
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
243 |
+
'legendgroup': 'Upstage SOLAR Instruct v1 (11B)',
|
244 |
+
'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
|
245 |
+
'name': 'Upstage SOLAR Instruct v1 (11B)',
|
246 |
+
'offsetgroup': 'Upstage SOLAR Instruct v1 (11B)',
|
247 |
+
'orientation': 'h',
|
248 |
+
'showlegend': True,
|
249 |
+
'textposition': 'auto',
|
250 |
+
'type': 'bar',
|
251 |
+
'x': array([0.10254]),
|
252 |
+
'xaxis': 'x',
|
253 |
+
'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object),
|
254 |
+
'yaxis': 'y'},
|
255 |
+
{'alignmentgroup': 'True',
|
256 |
+
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
257 |
+
'legendgroup': 'Vicuna v1.5 (7B)',
|
258 |
+
'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
|
259 |
+
'name': 'Vicuna v1.5 (7B)',
|
260 |
+
'offsetgroup': 'Vicuna v1.5 (7B)',
|
261 |
+
'orientation': 'h',
|
262 |
+
'showlegend': True,
|
263 |
+
'textposition': 'auto',
|
264 |
+
'type': 'bar',
|
265 |
+
'x': array([0.097484]),
|
266 |
+
'xaxis': 'x',
|
267 |
+
'y': array(['Vicuna v1.5 (7B)'], dtype=object),
|
268 |
+
'yaxis': 'y'},
|
269 |
+
{'alignmentgroup': 'True',
|
270 |
+
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
271 |
+
'legendgroup': 'Qwen 1.5 Chat (7B)',
|
272 |
+
'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
|
273 |
+
'name': 'Qwen 1.5 Chat (7B)',
|
274 |
+
'offsetgroup': 'Qwen 1.5 Chat (7B)',
|
275 |
+
'orientation': 'h',
|
276 |
+
'showlegend': True,
|
277 |
+
'textposition': 'auto',
|
278 |
+
'type': 'bar',
|
279 |
+
'x': array([0.092256]),
|
280 |
+
'xaxis': 'x',
|
281 |
+
'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
|
282 |
+
'yaxis': 'y'},
|
283 |
+
{'alignmentgroup': 'True',
|
284 |
+
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
285 |
+
'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
|
286 |
+
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
|
287 |
+
'name': 'OpenHermes-2.5-Mistral (7B)',
|
288 |
+
'offsetgroup': 'OpenHermes-2.5-Mistral (7B)',
|
289 |
+
'orientation': 'h',
|
290 |
+
'showlegend': True,
|
291 |
+
'textposition': 'auto',
|
292 |
+
'type': 'bar',
|
293 |
+
'x': array([0.089096]),
|
294 |
+
'xaxis': 'x',
|
295 |
+
'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
|
296 |
+
'yaxis': 'y'},
|
297 |
+
{'alignmentgroup': 'True',
|
298 |
+
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
299 |
+
'legendgroup': 'Falcon Instruct (7B)',
|
300 |
+
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
|
301 |
+
'name': 'Falcon Instruct (7B)',
|
302 |
+
'offsetgroup': 'Falcon Instruct (7B)',
|
303 |
+
'orientation': 'h',
|
304 |
+
'showlegend': True,
|
305 |
+
'textposition': 'auto',
|
306 |
+
'type': 'bar',
|
307 |
+
'x': array([0.07428]),
|
308 |
+
'xaxis': 'x',
|
309 |
+
'y': array(['Falcon Instruct (7B)'], dtype=object),
|
310 |
+
'yaxis': 'y'},
|
311 |
+
{'alignmentgroup': 'True',
|
312 |
+
'hovertemplate': 'Model=%{y}<br>Execution cost ($)=%{x}<extra></extra>',
|
313 |
+
'legendgroup': 'RedPajama-INCITE Chat (7B)',
|
314 |
+
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
|
315 |
+
'name': 'RedPajama-INCITE Chat (7B)',
|
316 |
+
'offsetgroup': 'RedPajama-INCITE Chat (7B)',
|
317 |
+
'orientation': 'h',
|
318 |
+
'showlegend': True,
|
319 |
+
'textposition': 'auto',
|
320 |
+
'type': 'bar',
|
321 |
+
'x': array([0.07172]),
|
322 |
+
'xaxis': 'x',
|
323 |
+
'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
|
324 |
'yaxis': 'y'}],
|
325 |
'layout': {'barmode': 'relative',
|
326 |
'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
|
327 |
'template': '...',
|
328 |
+
'title': {'text': 'Costs of execution of 5560 test queries per model'},
|
329 |
'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Execution cost ($)'}},
|
330 |
'yaxis': {'anchor': 'x',
|
331 |
+
'categoryarray': [RedPajama-INCITE Chat (7B), Falcon
|
332 |
+
Instruct (7B), OpenHermes-2.5-Mistral
|
333 |
+
(7B), Qwen 1.5 Chat (7B), Vicuna v1.5
|
334 |
+
(7B), Upstage SOLAR Instruct v1 (11B),
|
335 |
+
LLaMA-2 Chat (7B),
|
336 |
+
TinyLlama/TinyLlama-1.1B-Chat-v1.0,
|
337 |
+
WizardLM v1.2 (13B), Chronos Hermes
|
338 |
+
(13B), Mistral (7B) Instruct v0.2
|
339 |
+
(Together AI), chat-bison-32k (PaLM 2
|
340 |
+
32K), chat-bison (PaLM 2), Snorkel
|
341 |
+
Mistral PairRM DPO (7B), gemini-pro,
|
342 |
+
Mistral-7B-Instruct-v0.2, 01-ai Yi Chat
|
343 |
+
(34B), llama-2-70b-chat, zephyr-7b-beta,
|
344 |
Mixtral-8x7B-Instruct-v0.1,
|
345 |
+
gpt-3.5-turbo, gpt-4-turbo, gpt-4],
|
|
|
346 |
'categoryorder': 'array',
|
347 |
'domain': [0.0, 1.0],
|
348 |
'title': {'text': 'Model'}}}
|
349 |
+
})",Costs of execution of 5560 test queries per model,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[17.4942],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[8.7136],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.74798],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost 
($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.7427699999999999],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.6725011554823982],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.665964],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.40516800000000003],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost 
($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23022897595829436],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.178845],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.15948],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.15851500000000002],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost 
($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.151035],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.14824800000000002],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.141156],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.131244],""xaxis"":""x"",""y"":[""WizardLM v1.2 
(13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.11099814383188883],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.103212],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.10253999999999999],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 
(7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.097484],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.092256],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.08909600000000001],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.07428],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eExecution cost ($)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat 
(7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.07172],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"
",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""o
utlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidt
h"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland
"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Execution cost ($)""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Qwen 1.5 Chat (7B)"",""Vicuna v1.5 (7B)"",""Upstage SOLAR Instruct v1 (11B)"",""LLaMA-2 Chat (7B)"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""WizardLM v1.2 (13B)"",""Chronos Hermes (13B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)"",""Snorkel Mistral PairRM DPO (7B)"",""gemini-pro"",""Mistral-7B-Instruct-v0.2"",""01-ai Yi Chat (34B)"",""llama-2-70b-chat"",""zephyr-7b-beta"",""Mixtral-8x7B-Instruct-v0.1"",""gpt-3.5-turbo"",""gpt-4-turbo"",""gpt-4""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Costs of execution of 5560 test queries per model""},""barmode"":""relative""}}","{""y"": ""model"", ""x"": ""model_query_costs"", ""color"": ""model"", ""orientation"": ""h"", ""title"": ""Costs of execution of 5560 test queries per model"", ""labels"": {""model"": ""Model"", ""model_query_costs"": ""Execution cost ($)""}}",",model_query_costs,model
|
350 |
+
2,17.4942,gpt-4
|
351 |
+
1,8.7136,gpt-4-turbo
|
352 |
+
0,0.74798,gpt-3.5-turbo
|
353 |
+
4,0.7427699999999999,Mixtral-8x7B-Instruct-v0.1
|
354 |
+
5,0.6725011554823982,zephyr-7b-beta
|
355 |
+
3,0.665964,llama-2-70b-chat
|
356 |
+
11,0.40516800000000003,01-ai Yi Chat (34B)
|
357 |
+
6,0.23022897595829436,Mistral-7B-Instruct-v0.2
|
358 |
+
8,0.178845,gemini-pro
|
359 |
+
43,0.15948,Snorkel Mistral PairRM DPO (7B)
|
360 |
+
9,0.15851500000000002,chat-bison (PaLM 2)
|
361 |
+
10,0.151035,chat-bison-32k (PaLM 2 32K)
|
362 |
+
26,0.14824800000000002,Mistral (7B) Instruct v0.2 (Together AI)
|
363 |
+
12,0.141156,Chronos Hermes (13B)
|
364 |
+
55,0.131244,WizardLM v1.2 (13B)
|
365 |
+
7,0.11099814383188883,TinyLlama/TinyLlama-1.1B-Chat-v1.0
|
366 |
+
24,0.103212,LLaMA-2 Chat (7B)
|
367 |
+
56,0.10253999999999999,Upstage SOLAR Instruct v1 (11B)
|
368 |
+
17,0.097484,Vicuna v1.5 (7B)
|
369 |
+
40,0.092256,Qwen 1.5 Chat (7B)
|
370 |
+
46,0.08909600000000001,OpenHermes-2.5-Mistral (7B)
|
371 |
+
48,0.07428,Falcon Instruct (7B)
|
372 |
+
51,0.07172,RedPajama-INCITE Chat (7B)
|
373 |
"
|
374 |
model_sizes,./html/plots/model_sizes.html,"Figure({
|
375 |
'data': [{'alignmentgroup': 'True',
|
|
|
402 |
'yaxis': 'y'},
|
403 |
{'alignmentgroup': 'True',
|
404 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
405 |
+
'legendgroup': '01-ai Yi Chat (34B)',
|
406 |
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
|
407 |
+
'name': '01-ai Yi Chat (34B)',
|
408 |
+
'offsetgroup': '01-ai Yi Chat (34B)',
|
409 |
'orientation': 'h',
|
410 |
'showlegend': True,
|
411 |
'textposition': 'auto',
|
412 |
'type': 'bar',
|
413 |
+
'x': array([34.]),
|
414 |
'xaxis': 'x',
|
415 |
+
'y': array(['01-ai Yi Chat (34B)'], dtype=object),
|
416 |
'yaxis': 'y'},
|
417 |
{'alignmentgroup': 'True',
|
418 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
419 |
+
'legendgroup': 'WizardLM v1.2 (13B)',
|
420 |
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
|
421 |
+
'name': 'WizardLM v1.2 (13B)',
|
422 |
+
'offsetgroup': 'WizardLM v1.2 (13B)',
|
423 |
'orientation': 'h',
|
424 |
'showlegend': True,
|
425 |
'textposition': 'auto',
|
426 |
'type': 'bar',
|
427 |
+
'x': array([13.]),
|
428 |
'xaxis': 'x',
|
429 |
+
'y': array(['WizardLM v1.2 (13B)'], dtype=object),
|
430 |
'yaxis': 'y'},
|
431 |
{'alignmentgroup': 'True',
|
432 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
433 |
+
'legendgroup': 'Chronos Hermes (13B)',
|
434 |
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
|
435 |
+
'name': 'Chronos Hermes (13B)',
|
436 |
+
'offsetgroup': 'Chronos Hermes (13B)',
|
437 |
'orientation': 'h',
|
438 |
'showlegend': True,
|
439 |
'textposition': 'auto',
|
440 |
'type': 'bar',
|
441 |
+
'x': array([13.]),
|
442 |
'xaxis': 'x',
|
443 |
+
'y': array(['Chronos Hermes (13B)'], dtype=object),
|
444 |
'yaxis': 'y'},
|
445 |
{'alignmentgroup': 'True',
|
446 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
447 |
+
'legendgroup': 'Upstage SOLAR Instruct v1 (11B)',
|
448 |
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
|
449 |
+
'name': 'Upstage SOLAR Instruct v1 (11B)',
|
450 |
+
'offsetgroup': 'Upstage SOLAR Instruct v1 (11B)',
|
451 |
'orientation': 'h',
|
452 |
'showlegend': True,
|
453 |
'textposition': 'auto',
|
454 |
'type': 'bar',
|
455 |
+
'x': array([11.]),
|
456 |
'xaxis': 'x',
|
457 |
+
'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object),
|
458 |
'yaxis': 'y'},
|
459 |
{'alignmentgroup': 'True',
|
460 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
|
|
472 |
'yaxis': 'y'},
|
473 |
{'alignmentgroup': 'True',
|
474 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
475 |
+
'legendgroup': 'Mistral-7B-Instruct-v0.2',
|
476 |
'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
|
477 |
+
'name': 'Mistral-7B-Instruct-v0.2',
|
478 |
+
'offsetgroup': 'Mistral-7B-Instruct-v0.2',
|
479 |
'orientation': 'h',
|
480 |
'showlegend': True,
|
481 |
'textposition': 'auto',
|
482 |
'type': 'bar',
|
483 |
'x': array([7.]),
|
484 |
'xaxis': 'x',
|
485 |
+
'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
|
486 |
'yaxis': 'y'},
|
487 |
{'alignmentgroup': 'True',
|
488 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
|
|
514 |
'yaxis': 'y'},
|
515 |
{'alignmentgroup': 'True',
|
516 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
517 |
+
'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
|
518 |
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
|
519 |
+
'name': 'Snorkel Mistral PairRM DPO (7B)',
|
520 |
+
'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)',
|
521 |
+
'orientation': 'h',
|
522 |
+
'showlegend': True,
|
523 |
+
'textposition': 'auto',
|
524 |
+
'type': 'bar',
|
525 |
+
'x': array([7.]),
|
526 |
+
'xaxis': 'x',
|
527 |
+
'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
|
528 |
+
'yaxis': 'y'},
|
529 |
+
{'alignmentgroup': 'True',
|
530 |
+
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
531 |
+
'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
|
532 |
+
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
|
533 |
+
'name': 'OpenHermes-2.5-Mistral (7B)',
|
534 |
+
'offsetgroup': 'OpenHermes-2.5-Mistral (7B)',
|
535 |
+
'orientation': 'h',
|
536 |
+
'showlegend': True,
|
537 |
+
'textposition': 'auto',
|
538 |
+
'type': 'bar',
|
539 |
+
'x': array([7.]),
|
540 |
+
'xaxis': 'x',
|
541 |
+
'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
|
542 |
+
'yaxis': 'y'},
|
543 |
+
{'alignmentgroup': 'True',
|
544 |
+
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
545 |
+
'legendgroup': 'Falcon Instruct (7B)',
|
546 |
+
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
|
547 |
+
'name': 'Falcon Instruct (7B)',
|
548 |
+
'offsetgroup': 'Falcon Instruct (7B)',
|
549 |
+
'orientation': 'h',
|
550 |
+
'showlegend': True,
|
551 |
+
'textposition': 'auto',
|
552 |
+
'type': 'bar',
|
553 |
+
'x': array([7.]),
|
554 |
+
'xaxis': 'x',
|
555 |
+
'y': array(['Falcon Instruct (7B)'], dtype=object),
|
556 |
+
'yaxis': 'y'},
|
557 |
+
{'alignmentgroup': 'True',
|
558 |
+
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
559 |
+
'legendgroup': 'RedPajama-INCITE Chat (7B)',
|
560 |
+
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
|
561 |
'name': 'RedPajama-INCITE Chat (7B)',
|
562 |
'offsetgroup': 'RedPajama-INCITE Chat (7B)',
|
563 |
'orientation': 'h',
|
|
|
568 |
'xaxis': 'x',
|
569 |
'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
|
570 |
'yaxis': 'y'},
|
571 |
+
{'alignmentgroup': 'True',
|
572 |
+
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
573 |
+
'legendgroup': 'zephyr-7b-beta',
|
574 |
+
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
|
575 |
+
'name': 'zephyr-7b-beta',
|
576 |
+
'offsetgroup': 'zephyr-7b-beta',
|
577 |
+
'orientation': 'h',
|
578 |
+
'showlegend': True,
|
579 |
+
'textposition': 'auto',
|
580 |
+
'type': 'bar',
|
581 |
+
'x': array([7.]),
|
582 |
+
'xaxis': 'x',
|
583 |
+
'y': array(['zephyr-7b-beta'], dtype=object),
|
584 |
+
'yaxis': 'y'},
|
585 |
+
{'alignmentgroup': 'True',
|
586 |
+
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
587 |
+
'legendgroup': 'LLaMA-2 Chat (7B)',
|
588 |
+
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
|
589 |
+
'name': 'LLaMA-2 Chat (7B)',
|
590 |
+
'offsetgroup': 'LLaMA-2 Chat (7B)',
|
591 |
+
'orientation': 'h',
|
592 |
+
'showlegend': True,
|
593 |
+
'textposition': 'auto',
|
594 |
+
'type': 'bar',
|
595 |
+
'x': array([7.]),
|
596 |
+
'xaxis': 'x',
|
597 |
+
'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
|
598 |
+
'yaxis': 'y'},
|
599 |
{'alignmentgroup': 'True',
|
600 |
'hovertemplate': 'Model=%{y}<br>Model size (B params)=%{x}<extra></extra>',
|
601 |
'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
|
602 |
+
'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
|
603 |
'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
|
604 |
'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
|
605 |
'orientation': 'h',
|
|
|
617 |
'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'Model size (B params)'}},
|
618 |
'yaxis': {'anchor': 'x',
|
619 |
'categoryarray': [TinyLlama/TinyLlama-1.1B-Chat-v1.0,
|
620 |
+
LLaMA-2 Chat (7B), zephyr-7b-beta,
|
621 |
+
RedPajama-INCITE Chat (7B), Falcon
|
622 |
+
Instruct (7B), OpenHermes-2.5-Mistral
|
623 |
+
(7B), Snorkel Mistral PairRM DPO (7B),
|
624 |
+
Qwen 1.5 Chat (7B), Mistral (7B)
|
625 |
+
Instruct v0.2 (Together AI),
|
626 |
+
Mistral-7B-Instruct-v0.2, Vicuna v1.5
|
627 |
+
(7B), Upstage SOLAR Instruct v1 (11B),
|
628 |
+
Chronos Hermes (13B), WizardLM v1.2
|
629 |
+
(13B), 01-ai Yi Chat (34B),
|
630 |
Mixtral-8x7B-Instruct-v0.1,
|
631 |
llama-2-70b-chat],
|
632 |
'categoryorder': 'array',
|
633 |
'domain': [0.0, 1.0],
|
634 |
'title': {'text': 'Model'}}}
|
635 |
+
})",Model sizes in billions of parameters,,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[70.0],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[56.0],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[34.0],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[13.0],""xaxis"":""x"",""y"":[""WizardLM v1.2 
(13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[13.0],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[11.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B 
params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO 
(7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B 
params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[7.0],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eModel size (B params)=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[1.1],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram
2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],
[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table
"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#f
de0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""Model size (B params)""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""LLaMA-2 Chat (7B)"",""zephyr-7b-beta"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Snorkel Mistral PairRM DPO (7B)"",""Qwen 1.5 Chat (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""Mistral-7B-Instruct-v0.2"",""Vicuna v1.5 (7B)"",""Upstage SOLAR Instruct v1 (11B)"",""Chronos Hermes (13B)"",""WizardLM v1.2 (13B)"",""01-ai Yi Chat 
(34B)"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Model sizes in billions of parameters""},""barmode"":""relative""}}","{""x"": ""model_sizes"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""title"": ""Model sizes in billions of parameters"", ""labels"": {""model"": ""Model"", ""model_sizes"": ""Model size (B params)""}}",",model_sizes,model
|
636 |
0,70.0,llama-2-70b-chat
|
637 |
1,56.0,Mixtral-8x7B-Instruct-v0.1
|
638 |
+
5,34.0,01-ai Yi Chat (34B)
|
639 |
+
15,13.0,WizardLM v1.2 (13B)
|
640 |
+
6,13.0,Chronos Hermes (13B)
|
641 |
+
16,11.0,Upstage SOLAR Instruct v1 (11B)
|
642 |
+
7,7.0,Vicuna v1.5 (7B)
|
643 |
3,7.0,Mistral-7B-Instruct-v0.2
|
644 |
+
9,7.0,Mistral (7B) Instruct v0.2 (Together AI)
|
645 |
+
10,7.0,Qwen 1.5 Chat (7B)
|
646 |
+
11,7.0,Snorkel Mistral PairRM DPO (7B)
|
647 |
+
12,7.0,OpenHermes-2.5-Mistral (7B)
|
648 |
+
13,7.0,Falcon Instruct (7B)
|
649 |
+
14,7.0,RedPajama-INCITE Chat (7B)
|
650 |
+
2,7.0,zephyr-7b-beta
|
651 |
+
8,7.0,LLaMA-2 Chat (7B)
|
652 |
4,1.1,TinyLlama/TinyLlama-1.1B-Chat-v1.0
|
653 |
"
|
654 |
model_context_lengths,./html/plots/model_context_lengths.html,"Figure({
|
data/model_costs.csv
ADDED
@@ -0,0 +1,58 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
model,provider,cost_per_token,provider_pricing
|
2 |
+
gpt-3.5-turbo,OpenAI,"$1 / 1M input tokens, $2 / 1M output tokens","$1 / 1M input tokens, $2 / 1M output tokens"
|
3 |
+
gpt-4-turbo,OpenAI,"$10 / 1M input tokens, $30 / 1M output tokens","$10 / 1M input tokens, $30 / 1M output tokens"
|
4 |
+
gpt-4,OpenAI,"$30 / 1M input tokens, $60 / 1M output tokens","$30 / 1M input tokens, $60 / 1M output tokens"
|
5 |
+
llama-2-70b-chat,Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
|
6 |
+
Mixtral-8x7B-Instruct-v0.1,Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
|
7 |
+
zephyr-7b-beta,Hugging Face Inference Endpoint,$0.15 / 1M tokens,$1.3 / hour
|
8 |
+
Mistral-7B-Instruct-v0.2,Hugging Face Inference Endpoint,$0.14 / 1M tokens,$1.3 / hour
|
9 |
+
TinyLlama/TinyLlama-1.1B-Chat-v1.0,Hugging Face Inference Endpoint,$0.068 / 1M tokens,$0.6 / hour
|
10 |
+
gemini-pro,Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input characters, $0.5 / 1M output characters (60 queries per minute are free)"
|
11 |
+
chat-bison (PaLM 2),Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
|
12 |
+
chat-bison-32k (PaLM 2 32K),Google VertexAI,"$0.25 / 1M input tokens, $0.5 / 1M output tokens","$0.25 / 1M input tokens, $0.5 / 1M output tokens"
|
13 |
+
01-ai Yi Chat (34B),Together AI,$0.8 / 1M tokens,$0.8 / 1M tokens
|
14 |
+
Chronos Hermes (13B),Together AI,$0.3 / 1M tokens,$0.3 / 1M tokens
|
15 |
+
Deepseek Coder Instruct (33B),Together AI,$0.8 / 1M tokens,$0.8 / 1M tokens
|
16 |
+
Platypus2 Instruct (70B),Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
|
17 |
+
MythoMax-L2 (13B),Together AI,$0.3 / 1M tokens,$0.3 / 1M tokens
|
18 |
+
Vicuna v1.5 (13B),Together AI,$0.3 / 1M tokens,$0.3 / 1M tokens
|
19 |
+
Vicuna v1.5 (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
20 |
+
Code Llama Instruct (13B),Together AI,$0.3 / 1M tokens,$0.3 / 1M tokens
|
21 |
+
Code Llama Instruct (34B),Together AI,$0.8 / 1M tokens,$0.8 / 1M tokens
|
22 |
+
Code Llama Instruct (70B),Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
|
23 |
+
Code Llama Instruct (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
24 |
+
LLaMA-2 Chat (13B),Together AI,$0.3 / 1M tokens,$0.3 / 1M tokens
|
25 |
+
LLaMA-2 Chat (70B),Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
|
26 |
+
LLaMA-2 Chat (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
27 |
+
Mistral (7B) Instruct,Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
28 |
+
Mistral (7B) Instruct v0.2 (Together AI),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
29 |
+
Mixtral-8x7B Instruct (46.7B),Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
|
30 |
+
Nous Capybara v1.9 (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
31 |
+
Nous Hermes 2 - Mixtral 8x7B-DPO (46.7B),Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
|
32 |
+
Nous Hermes 2 - Mixtral 8x7B-SFT (46.7B),Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
|
33 |
+
Nous Hermes LLaMA-2 (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
34 |
+
Nous Hermes Llama-2 (13B),Together AI,$0.3 / 1M tokens,$0.3 / 1M tokens
|
35 |
+
Nous Hermes-2 Yi (34B),Together AI,$0.8 / 1M tokens,$0.8 / 1M tokens
|
36 |
+
OpenChat 3.5 (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
37 |
+
OpenOrca Mistral (7B) 8K,Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
38 |
+
Qwen-Chat (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
39 |
+
Qwen 1.5 Chat (0.5B),Together AI,$0.1 / 1M tokens,$0.1 / 1M tokens
|
40 |
+
Qwen 1.5 Chat (1.8B),Together AI,$0.1 / 1M tokens,$0.1 / 1M tokens
|
41 |
+
Qwen 1.5 Chat (4B),Together AI,$0.1 / 1M tokens,$0.1 / 1M tokens
|
42 |
+
Qwen 1.5 Chat (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
43 |
+
Qwen 1.5 Chat (14B),Together AI,$0.3 / 1M tokens,$0.3 / 1M tokens
|
44 |
+
Qwen 1.5 Chat (72B),Together AI,$0.9 / 1M tokens,$0.9 / 1M tokens
|
45 |
+
Snorkel Mistral PairRM DPO (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
46 |
+
Alpaca (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
47 |
+
OpenHermes-2-Mistral (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
48 |
+
OpenHermes-2.5-Mistral (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
49 |
+
Falcon Instruct (40B),Together AI,$0.8 / 1M tokens,$0.8 / 1M tokens
|
50 |
+
Falcon Instruct (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
51 |
+
LLaMA-2-7B-32K-Instruct (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
52 |
+
RedPajama-INCITE Chat (3B),Together AI,$0.1 / 1M tokens,$0.1 / 1M tokens
|
53 |
+
RedPajama-INCITE Chat (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
54 |
+
StripedHyena Nous (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
55 |
+
ReMM SLERP L2 (13B),Together AI,$0.3 / 1M tokens,$0.3 / 1M tokens
|
56 |
+
Toppy M (7B),Together AI,$0.2 / 1M tokens,$0.2 / 1M tokens
|
57 |
+
WizardLM v1.2 (13B),Together AI,$0.3 / 1M tokens,$0.3 / 1M tokens
|
58 |
+
Upstage SOLAR Instruct v1 (11B),Together AI,$0.3 / 1M tokens,$0.3 / 1M tokens
|
data/output_plots.csv
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
data/summary.csv
ADDED
@@ -0,0 +1,95 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
model,language,template_name,execution_time,characters_count,words_count,chunk_sizes_mean,chunk_sizes_min,chunk_sizes_max,chunk_generation_times_mean,chunk_generation_times_min,chunk_generation_times_max
|
2 |
+
01-ai Yi Chat (34B),english,json,3.740751821820329,339.4756097560976,57.926829268292686,3.8364112458654906,1.0,14.0,0.028872832803768254,0.0004601478576660156,0.6119933128356934
|
3 |
+
01-ai Yi Chat (34B),english,markdown,4.911168761369659,545.0121951219512,91.32926829268293,4.251426940639269,1.0,15.0,0.029400016551148402,0.000396728515625,0.6902577877044678
|
4 |
+
01-ai Yi Chat (34B),japanese,json,13.06497314438891,388.7910447761194,11.104477611940299,1.1905393053016453,1.0,10.0,0.03675604747026014,0.00048804283142089844,0.6865222454071045
|
5 |
+
01-ai Yi Chat (34B),japanese,markdown,20.104321274038863,587.4657534246576,17.876712328767123,1.151120654945645,1.0,13.0,0.036697812292211376,0.0004608631134033203,0.6928038597106934
|
6 |
+
Chronos Hermes (13B),english,json,2.974407357828958,368.92857142857144,63.107142857142854,3.5136054421768708,1.0,15.0,0.02094727554559167,0.00027179718017578125,0.6065487861633301
|
7 |
+
Chronos Hermes (13B),english,markdown,2.6719689165673604,361.8536585365854,61.97560975609756,3.6452088452088454,1.0,14.0,0.02059152469002351,0.0004761219024658203,0.28253698348999023
|
8 |
+
Chronos Hermes (13B),japanese,json,15.704193201558343,687.3620689655172,23.344827586206897,1.1621337997376475,1.0,14.0,0.023474197327925606,0.0003821849822998047,0.3109428882598877
|
9 |
+
Chronos Hermes (13B),japanese,markdown,11.713542679945627,1075.8,142.26666666666668,2.5384615384615383,1.0,16.0,0.023924544976345302,0.0004260540008544922,0.34424543380737305
|
10 |
+
Falcon Instruct (7B),english,json,1.9191903869311016,82.66666666666667,15.766666666666667,4.235695986336465,1.0,13.0,0.012606756387868567,0.0004930496215820312,0.08649563789367676
|
11 |
+
Falcon Instruct (7B),english,markdown,1.8954222866746246,89.24590163934427,15.245901639344263,4.60965283657917,1.0,13.0,0.012657315119356548,0.0003917217254638672,0.09382963180541992
|
12 |
+
Falcon Instruct (7B),japanese,json,0.9907723726370395,35.37179487179487,7.051282051282051,3.6983914209115283,1.0,10.0,0.013643914509075258,0.00037479400634765625,0.0781710147857666
|
13 |
+
Falcon Instruct (7B),japanese,markdown,0.6273794174194336,8.873417721518987,2.088607594936709,3.3864734299516908,1.0,13.0,0.010549438172492428,0.000865936279296875,0.034580230712890625
|
14 |
+
LLaMA-2 Chat (7B),english,json,2.602991385893388,348.05194805194805,60.311688311688314,3.5179837227618798,1.0,14.0,0.007298828235414905,0.0002570152282714844,0.12662744522094727
|
15 |
+
LLaMA-2 Chat (7B),english,markdown,2.678575509124332,402.0416666666667,69.375,3.747669601242879,1.0,16.0,0.0077138773707266855,0.00035452842712402344,0.2196364402770996
|
16 |
+
LLaMA-2 Chat (7B),japanese,json,4.055958332334246,471.92857142857144,53.114285714285714,1.9620478707608244,1.0,14.0,0.009438785980169328,0.00035572052001953125,0.1930844783782959
|
17 |
+
LLaMA-2 Chat (7B),japanese,markdown,4.446276148704634,717.1232876712329,67.6986301369863,1.8702440070022508,1.0,16.0,0.008583835081750738,0.0003447532653808594,0.2040574550628662
|
18 |
+
Mistral (7B) Instruct v0.2 (Together AI),english,json,2.0136800810822053,344.508547008547,56.93589743589744,3.8069040423120515,1.0,15.0,0.00794907963001192,0.0002071857452392578,0.30161213874816895
|
19 |
+
Mistral (7B) Instruct v0.2 (Together AI),english,markdown,2.5499956497567235,452.242774566474,73.121387283237,3.7100720789074355,1.0,15.0,0.007905251983898002,0.0002067089080810547,0.4635443687438965
|
20 |
+
Mistral (7B) Instruct v0.2 (Together AI),japanese,json,3.768558966402976,271.26490066225165,5.172185430463577,1.0484271417236173,1.0,13.0,0.009928898496573373,0.00023865699768066406,2.616291046142578
|
21 |
+
Mistral (7B) Instruct v0.2 (Together AI),japanese,markdown,7.687208134916764,1178.012658227848,138.30379746835442,1.9892057113543091,1.0,109.0,0.010960863498020433,0.00021409988403320312,8.214757204055786
|
22 |
+
Mistral-7B-Instruct-v0.2,english,json,4.278648148264204,342.8,55.15,4.1311870534561415,1.0,15.0,0.040544769239987996,0.00024437904357910156,60.7178213596344
|
23 |
+
Mistral-7B-Instruct-v0.2,english,markdown,3.7188014924526214,366.85,57.1375,4.239202657807309,1.0,16.0,0.03371991898375372,0.020945072174072266,0.25538039207458496
|
24 |
+
Mistral-7B-Instruct-v0.2,japanese,json,2.413569121701377,52.07857142857143,3.414285714285714,1.2991803278688525,1.0,11.0,0.039267738759305254,0.00047779083251953125,3.370748996734619
|
25 |
+
Mistral-7B-Instruct-v0.2,japanese,markdown,2.323612022399902,42.25,1.5833333333333333,1.1069868995633187,1.0,6.0,0.03958142719935121,0.0004932880401611328,0.2205650806427002
|
26 |
+
Mixtral-8x7B-Instruct-v0.1,english,json,3.665129848137623,403.2542016806723,62.4390756302521,4.138125060633172,1.0,15.0,0.01437194579115682,0.0002009868621826172,3.4127349853515625
|
27 |
+
Mixtral-8x7B-Instruct-v0.1,english,markdown,5.775103669417532,522.9172932330827,83.45864661654136,4.350284606242572,1.0,15.0,0.015317759848210679,0.00020313262939453125,1.7103569507598877
|
28 |
+
Mixtral-8x7B-Instruct-v0.1,japanese,json,7.287098480350196,556.9218106995885,63.477366255144034,2.2494971825601304,1.0,109.0,0.02290278010061531,0.00020551681518554688,76.45081758499146
|
29 |
+
Mixtral-8x7B-Instruct-v0.1,japanese,markdown,9.511569020294008,432.14285714285717,7.2976190476190474,1.0973066110456153,1.0,12.0,0.017938276822029118,0.00019669532775878906,3.0317282676696777
|
30 |
+
OpenHermes-2.5-Mistral (7B),english,json,2.2801950351301445,356.66265060240966,58.87951807228916,3.619833700171191,1.0,15.0,0.009280798020646228,0.0003464221954345703,0.34207844734191895
|
31 |
+
OpenHermes-2.5-Mistral (7B),english,markdown,2.5686250015308985,381.69736842105266,63.828947368421055,3.9398343066684776,1.0,15.0,0.009823806159897504,0.00034999847412109375,0.32857298851013184
|
32 |
+
OpenHermes-2.5-Mistral (7B),japanese,json,2.385033627835716,143.78048780487805,4.060975609756097,1.0738682940158484,1.0,8.0,0.013302163463633877,0.0003523826599121094,0.34746313095092773
|
33 |
+
OpenHermes-2.5-Mistral (7B),japanese,markdown,4.09419917478794,346.7682926829268,4.865853658536586,1.0120297540662704,1.0,9.0,0.010479846772686987,0.0003566741943359375,0.6548421382904053
|
34 |
+
Qwen 1.5 Chat (7B),english,json,2.176741310312778,316.40506329113924,52.949367088607595,3.865161589608783,1.0,15.0,0.0067587282957351615,0.00036597251892089844,0.13403892517089844
|
35 |
+
Qwen 1.5 Chat (7B),english,markdown,2.384753034084658,433.1898734177215,71.48101265822785,4.243799603174603,1.0,15.0,0.00671186927883398,0.00036978721618652344,0.14255690574645996
|
36 |
+
Qwen 1.5 Chat (7B),japanese,json,2.2887367900413804,207.50632911392404,4.139240506329114,1.4821880650994574,1.0,17.0,0.007465819402801624,0.00038743019104003906,0.21312594413757324
|
37 |
+
Qwen 1.5 Chat (7B),japanese,markdown,2.041359633575251,220.80246913580248,1.876543209876543,1.465142950765954,1.0,17.0,0.007345383120587039,0.00035572052001953125,0.13096904754638672
|
38 |
+
RedPajama-INCITE Chat (7B),english,json,1.9923779017785017,56.0,5.514705882352941,2.9337442218798153,1.0,15.0,0.02580270341070848,0.00044846534729003906,0.131911039352417
|
39 |
+
RedPajama-INCITE Chat (7B),english,markdown,2.0556714431099268,55.04347826086956,5.217391304347826,2.928296067848882,1.0,70.0,0.02626570611158149,0.0004153251647949219,0.939018964767456
|
40 |
+
RedPajama-INCITE Chat (7B),japanese,json,1.801509298929354,53.58536585365854,5.853658536585366,2.816666666666667,1.0,13.0,0.02727127411426642,0.0003719329833984375,0.1054222583770752
|
41 |
+
RedPajama-INCITE Chat (7B),japanese,markdown,1.896126465099614,77.59756097560975,4.439024390243903,4.019583070120025,1.0,70.0,0.02732501960749575,0.0007987022399902344,0.4024965763092041
|
42 |
+
Snorkel Mistral PairRM DPO (7B),english,json,3.095366932551066,949.9333333333333,150.72,3.8147890340544013,1.0,15.0,0.007307618875579115,0.00022792816162109375,0.1967298984527588
|
43 |
+
Snorkel Mistral PairRM DPO (7B),english,markdown,2.583486044406891,507.9625,78.75,4.004829013501528,1.0,15.0,0.00809382158769837,0.0003504753112792969,0.27209019660949707
|
44 |
+
Snorkel Mistral PairRM DPO (7B),japanese,json,7.790234556680994,1704.5189873417721,208.60759493670886,1.981328075570531,1.0,15.0,0.008026355929728519,0.0003476142883300781,0.49362945556640625
|
45 |
+
Snorkel Mistral PairRM DPO (7B),japanese,markdown,89.00719798347096,17120.925925925927,504.25925925925924,1.0784030121985644,1.0,14.0,0.005559155525883009,0.00032520294189453125,1.1380209922790527
|
46 |
+
TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,json,1.9458302193674548,366.25,61.58965517241379,4.169774654522613,1.0,13.0,0.012296600931852907,0.00024318695068359375,0.17363858222961426
|
47 |
+
TinyLlama/TinyLlama-1.1B-Chat-v1.0,english,markdown,1.6830505162477494,282.55,47.1125,3.9572829131652663,1.0,14.0,0.012217252319600401,0.0003170967102050781,0.15227961540222168
|
48 |
+
TinyLlama/TinyLlama-1.1B-Chat-v1.0,japanese,json,1.4167885013989039,72.81428571428572,8.8,2.0274463007159906,1.0,13.0,0.014790566363975749,0.00031280517578125,0.3310587406158447
|
49 |
+
TinyLlama/TinyLlama-1.1B-Chat-v1.0,japanese,markdown,1.336316986878713,89.78333333333333,12.716666666666667,2.432054176072235,1.0,13.0,0.013910464400900675,0.0005300045013427734,0.176621675491333
|
50 |
+
Vicuna v1.5 (7B),english,json,2.851835834980011,372.4375,63.9875,3.508596325953839,1.0,15.0,0.011230722554045582,0.0003688335418701172,0.11755537986755371
|
51 |
+
Vicuna v1.5 (7B),english,markdown,2.0539027697000747,382.4230769230769,64.55128205128206,3.7235051803769816,1.0,15.0,0.011191664883712751,0.00037550926208496094,0.1981511116027832
|
52 |
+
Vicuna v1.5 (7B),japanese,json,4.896489579230547,304.5,16.9375,1.2847254268574066,1.0,15.0,0.015209688069330176,0.0003762245178222656,0.319460391998291
|
53 |
+
Vicuna v1.5 (7B),japanese,markdown,5.635414824556949,301.55223880597015,3.2686567164179103,1.034511008704557,1.0,11.0,0.015171443860590671,0.0003802776336669922,0.19443845748901367
|
54 |
+
WizardLM v1.2 (13B),english,json,3.101118081236539,280.52054794520546,48.0958904109589,3.2891101831031158,1.0,15.0,0.021355988586442935,0.00036406517028808594,0.4714198112487793
|
55 |
+
WizardLM v1.2 (13B),english,markdown,3.5972929232650332,357.5138888888889,61.013888888888886,3.8293662600416543,1.0,14.0,0.02164479360378984,0.0005571842193603516,0.5012450218200684
|
56 |
+
WizardLM v1.2 (13B),japanese,json,6.448913824267503,213.4878048780488,4.7682926829268295,1.0483262470806636,1.0,7.0,0.027856862946922703,0.00034737586975097656,0.5480227470397949
|
57 |
+
WizardLM v1.2 (13B),japanese,markdown,8.740011346049425,292.6341463414634,7.634146341463414,1.0085319211532804,1.0,9.0,0.02801978238888618,0.0004551410675048828,0.8807919025421143
|
58 |
+
chat-bison (PaLM 2),english,json,2.5406186148524283,381.7267857142857,60.88125,78.31727422604872,1.0,142.0,0.3495202942369709,0.0003688335418701172,7.334931373596191
|
59 |
+
chat-bison (PaLM 2),english,markdown,2.9635989278554917,490.4875,78.5375,84.20386266094421,1.0,138.0,0.3641034907025841,0.0004639625549316406,4.600815534591675
|
60 |
+
chat-bison (PaLM 2),japanese,json,3.0616454005241396,232.68,10.48,34.21764705882353,3.0,124.0,0.326771635167739,0.0005857944488525391,2.7724690437316895
|
61 |
+
chat-bison (PaLM 2),japanese,markdown,4.669546687602997,431.725,13.85,31.74448529411765,2.0,124.0,0.27883222348549785,0.0005550384521484375,7.114030122756958
|
62 |
+
chat-bison-32k (PaLM 2 32K),english,json,7.142214598400252,335.47232142857143,53.799107142857146,77.18344289235826,1.0,133.0,1.4512595853652734,0.00041985511779785156,101.5493803024292
|
63 |
+
chat-bison-32k (PaLM 2 32K),english,markdown,3.44630788564682,429.95,69.35,82.6826923076923,1.0,133.0,0.5048719226167753,0.0005412101745605469,18.035786390304565
|
64 |
+
chat-bison-32k (PaLM 2 32K),japanese,json,5.072022783756256,272.85,10.35,34.320754716981135,4.0,124.0,0.5336985453119818,0.0005052089691162109,52.47814655303955
|
65 |
+
chat-bison-32k (PaLM 2 32K),japanese,markdown,6.1971998631954195,446.45,21.4,32.118705035971225,5.0,124.0,0.3856057263106751,0.0005400180816650391,7.165225505828857
|
66 |
+
gemini-pro,english,json,2.7415290858475547,388.5206321334504,62.01755926251097,204.58853444290338,1.0,988.0,1.4202116817663073,0.0004703998565673828,13.73231840133667
|
67 |
+
gemini-pro,english,markdown,3.0089986324310303,487.1458333333333,80.67708333333333,183.39607843137256,12.0,472.0,1.1130499073103362,0.0006177425384521484,4.875006198883057
|
68 |
+
gemini-pro,japanese,json,4.5300196591070145,276.6694915254237,6.983050847457627,91.1927374301676,4.0,333.0,1.4752027082709627,0.0006062984466552734,8.291066646575928
|
69 |
+
gemini-pro,japanese,markdown,6.166934008781727,422.7307692307692,9.096153846153847,90.83471074380165,9.0,266.0,1.3123543331445742,0.0006639957427978516,13.754565954208374
|
70 |
+
gpt-3.5-turbo,english,call,2.908525016600803,456.85911016949154,72.26059322033899,,,,,,
|
71 |
+
gpt-3.5-turbo,english,json,2.566863525494622,398.56960556844547,65.32366589327147,4.806746320443226,1.0,16.0,0.015585779219764062,0.0005395412445068359,1.4500916004180908
|
72 |
+
gpt-3.5-turbo,english,markdown,2.3388922008184285,506.90384615384613,81.99038461538461,5.050584403142365,1.0,16.0,0.01715806382989308,0.0005617141723632812,1.127073049545288
|
73 |
+
gpt-3.5-turbo,japanese,call,7.255881716940138,382.95,6.351111111111111,,,,,,
|
74 |
+
gpt-3.5-turbo,japanese,json,5.226112197780009,237.1069182389937,3.559748427672956,1.1291481969569905,1.0,7.0,0.02129129201220198,0.0005452632904052734,13.75982117652893
|
75 |
+
gpt-3.5-turbo,japanese,markdown,7.29901300883684,358.72131147540983,6.065573770491803,1.1894977168949772,1.0,15.0,0.021750167313542772,0.0005612373352050781,13.71114993095398
|
76 |
+
gpt-4,english,call,9.15708539162022,374.16815144766144,59.661469933184854,,,,,,
|
77 |
+
gpt-4,english,json,7.963626848197565,383.3707317073171,61.69512195121951,4.7834568389659005,1.0,16.0,0.08687007305138472,0.000537872314453125,3.531284809112549
|
78 |
+
gpt-4,english,markdown,10.02310108244419,428.35,67.825,4.990243192078054,1.0,16.0,0.10377185442257747,0.0005447864532470703,2.087376117706299
|
79 |
+
gpt-4,japanese,call,24.259297592319243,214.9076023391813,1.1695906432748537,,,,,,
|
80 |
+
gpt-4,japanese,json,22.703774025460252,211.63025210084032,4.168067226890757,1.1685226429101707,1.0,7.0,0.11835955503744466,0.0005507469177246094,3.5608017444610596
|
81 |
+
gpt-4,japanese,markdown,31.99519391655922,275.1,2.925,1.1327980234712787,1.0,9.0,0.12606545905407157,0.0005619525909423828,2.9794347286224365
|
82 |
+
gpt-4-turbo,english,call,7.319288367695279,372.86,58.532222222222224,,,,,,
|
83 |
+
gpt-4-turbo,english,json,6.457074524425879,407.0243902439024,64.18414634146342,4.735998183701559,1.0,17.0,0.06474667943090798,0.0006806850433349609,5.431884765625
|
84 |
+
gpt-4-turbo,english,markdown,8.325546002388,462.1125,71.925,4.984360253471754,1.0,16.0,0.07950969425127868,0.0006999969482421875,2.0926766395568848
|
85 |
+
gpt-4-turbo,japanese,call,32.67405146055443,372.7860465116279,24.886046511627907,,,,,,
|
86 |
+
gpt-4-turbo,japanese,json,19.359180968999862,250.44166666666666,6.183333333333334,1.184261339007763,1.0,8.0,0.08582140138847597,0.0006830692291259766,13.252992153167725
|
87 |
+
gpt-4-turbo,japanese,markdown,20.977174520492554,283.55,4.45,1.1460038395473375,1.0,10.0,0.07991695286011809,0.0007085800170898438,2.3845231533050537
|
88 |
+
llama-2-70b-chat,english,json,2.917410132025375,355.7463556851312,54.861030126336246,4.02267032967033,1.0,15.0,0.019103390617685005,0.0001990795135498047,3.8762006759643555
|
89 |
+
llama-2-70b-chat,english,markdown,4.99397261045417,827.5714285714286,125.95918367346938,4.177931176591799,1.0,16.0,0.018161741699259625,0.0002124309539794922,0.7439091205596924
|
90 |
+
llama-2-70b-chat,japanese,json,5.265992468681889,369.3768115942029,42.56521739130435,2.3362207250561435,1.0,15.0,0.023359512199899433,0.00020837783813476562,0.9314718246459961
|
91 |
+
llama-2-70b-chat,japanese,markdown,11.084085723449444,1379.6896551724137,158.01724137931035,2.2644745033674796,1.0,16.0,0.01566780037868879,0.0002117156982421875,76.44498753547668
|
92 |
+
zephyr-7b-beta,english,json,4.252429554081262,376.7899686520376,61.78369905956113,4.26030553291036,1.0,14.0,0.03764735399563352,0.0003070831298828125,1.0504331588745117
|
93 |
+
zephyr-7b-beta,english,markdown,4.788659170695714,376.10714285714283,61.15,4.393408427200668,1.0,15.0,0.04506704832147846,0.00040459632873535156,75.15552616119385
|
94 |
+
zephyr-7b-beta,japanese,json,2.6574003274624163,44.75,3.6923076923076925,1.152208358090711,1.0,7.0,0.044344271615274496,0.018090486526489258,1.1675689220428467
|
95 |
+
zephyr-7b-beta,japanese,markdown,2.6084938406944276,40.0,2.39,1.0282776349614395,1.0,4.0,0.042658403845250145,0.02583909034729004,1.2674541473388672
|
pipeline/config.py
CHANGED
@@ -36,7 +36,7 @@ class QueriesConfig(Config):
|
|
36 |
class MeasurementsConfig(Config):
|
37 |
mock: bool = False
|
38 |
remove_old_measurements: bool = False
|
39 |
-
small_dataset: bool =
|
40 |
|
41 |
|
42 |
class QueriesDatasetConfig(Config):
|
|
|
36 |
# Boolean switches grouped under MeasurementsConfig (a Config subclass).
# All three flags default to False; what each one toggles is decided by the
# code that reads this config, which is not visible here.
class MeasurementsConfig(Config):
|
37 |
mock: bool = False
|
38 |
remove_old_measurements: bool = False
|
39 |
+
small_dataset: bool = False
|
40 |
|
41 |
|
42 |
class QueriesDatasetConfig(Config):
|
pipeline/models.py
CHANGED
@@ -1,5 +1,6 @@
|
|
1 |
import os
|
2 |
from dataclasses import dataclass
|
|
|
3 |
|
4 |
|
5 |
@dataclass(unsafe_hash=True)
|
@@ -525,6 +526,27 @@ MISSING_MEASUREMENTS = ['Mistral-7B-Instruct-v0.2',
|
|
525 |
'WizardLM v1.2 (13B)',
|
526 |
'Upstage SOLAR Instruct v1 (11B)']
|
527 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
528 |
for model in MODELS:
|
529 |
if model.model_display_name in MISSING_MEASUREMENTS:
|
530 |
model.selected = True
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
import os
|
2 |
from dataclasses import dataclass
|
3 |
+
import re
|
4 |
|
5 |
|
6 |
@dataclass(unsafe_hash=True)
|
|
|
526 |
'WizardLM v1.2 (13B)',
|
527 |
'Upstage SOLAR Instruct v1 (11B)']
|
528 |
|
529 |
+
def together_ai_price(billions_of_parameters):
    """Return the Together AI price tier for a model of the given size.

    The result is what the caller stores in ``cost_per_million_tokens``.

    Tiers use inclusive upper bounds and are contiguous, so every size maps
    to exactly one price.  (The previous chain of ``4.1 <= x``, ``8.1 <= x``
    and ``21.1 <= x`` checks left small gaps -- e.g. 4.05 or 8.05 -- that
    matched no branch and silently returned ``None``.)

    Args:
        billions_of_parameters: Model size in billions of parameters.

    Returns:
        The price for the tier the size falls into, as a float.
    """
    # (inclusive upper bound in billions of parameters, price), ascending.
    tiers = (
        (4, 0.1),
        (8, 0.2),
        (21, 0.3),
        (41, 0.8),
    )
    for upper_bound, price in tiers:
        if billions_of_parameters <= upper_bound:
            return price
    # Anything larger than 41B lands in the top tier; the original code
    # carried a commented-out "<= 70" cap here, deliberately left open.
    return 0.9
|
540 |
+
|
541 |
# Post-process every entry in MODELS at import time.
# NOTE(review): this is a flattened diff view, so the original indentation is
# lost; the nesting described in the comments below is the most natural
# reading -- confirm against the real file.
for model in MODELS:
|
542 |
# Mark models whose display name is listed in MISSING_MEASUREMENTS as selected.
if model.model_display_name in MISSING_MEASUREMENTS:
|
543 |
model.selected = True
|
544 |
+
|
545 |
+
# Only models whose provider is exactly "Together AI" get a derived price.
if model.provider == "Together AI":
|
546 |
+
# Matches a "(<number>B)" token such as "(13B)" or "(7.5B)"; group 1 is the number.
pattern = r"\((\d+(\.\d+)?)B\)"
|
547 |
+
# re.search scans the whole display name, so the token may appear anywhere in it.
match = re.search(pattern, model.model_display_name)
|
548 |
+
# Display names without such a token leave size and cost untouched.
if match:
|
549 |
+
number_in_parenthesis = float(match.group(1))
|
550 |
+
model.size_billion_parameters = number_in_parenthesis
|
551 |
+
# Price is looked up from the parsed size via together_ai_price.
model.cost_per_million_tokens = together_ai_price(model.size_billion_parameters)
|
552 |
+
# Re-runs the dataclass __post_init__ hook -- presumably to refresh fields
# derived from the attributes set above; TODO confirm, and confirm whether
# this call sits under `if match:` or under the provider check.
model.__post_init__()
|