diff --git "a/data/summary_metrics_plots.csv" "b/data/summary_metrics_plots.csv"
--- "a/data/summary_metrics_plots.csv"
+++ "b/data/summary_metrics_plots.csv"
@@ -1,7 +1,7 @@
plot_object,header,plot_json,description,df,arguments
"Figure({
'data': [{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'gpt-3.5-turbo',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
'name': 'gpt-3.5-turbo',
@@ -10,12 +10,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.4943981], dtype=float32),
+ 'x': array([0.49478123], dtype=float32),
'xaxis': 'x',
'y': array(['gpt-3.5-turbo'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'gpt-4',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
'name': 'gpt-4',
@@ -24,12 +24,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.48605907], dtype=float32),
+ 'x': array([0.4864653], dtype=float32),
'xaxis': 'x',
'y': array(['gpt-4'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'gpt-4-turbo',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
'name': 'gpt-4-turbo',
@@ -38,12 +38,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.42728576], dtype=float32),
+ 'x': array([0.42933634], dtype=float32),
'xaxis': 'x',
'y': array(['gpt-4-turbo'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
@@ -52,12 +52,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.3647361], dtype=float32),
+ 'x': array([0.36488953], dtype=float32),
'xaxis': 'x',
'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
'name': 'OpenHermes-2.5-Mistral (7B)',
@@ -66,12 +66,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.3618188], dtype=float32),
+ 'x': array([0.3621834], dtype=float32),
'xaxis': 'x',
'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'Qwen 1.5 Chat (7B)',
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
'name': 'Qwen 1.5 Chat (7B)',
@@ -80,12 +80,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.34855434], dtype=float32),
+ 'x': array([0.34898603], dtype=float32),
'xaxis': 'x',
'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'WizardLM v1.2 (13B)',
'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
'name': 'WizardLM v1.2 (13B)',
@@ -94,12 +94,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.34085444], dtype=float32),
+ 'x': array([0.3420949], dtype=float32),
'xaxis': 'x',
'y': array(['WizardLM v1.2 (13B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': '01-ai Yi Chat (34B)',
'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
'name': '01-ai Yi Chat (34B)',
@@ -108,12 +108,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.33974892], dtype=float32),
+ 'x': array([0.33981326], dtype=float32),
'xaxis': 'x',
'y': array(['01-ai Yi Chat (34B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'LLaMA-2 Chat (7B)',
'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
'name': 'LLaMA-2 Chat (7B)',
@@ -122,12 +122,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.3203912], dtype=float32),
+ 'x': array([0.32074162], dtype=float32),
'xaxis': 'x',
'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
'name': 'Snorkel Mistral PairRM DPO (7B)',
@@ -136,12 +136,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.31672964], dtype=float32),
+ 'x': array([0.3167385], dtype=float32),
'xaxis': 'x',
'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'Chronos Hermes (13B)',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
'name': 'Chronos Hermes (13B)',
@@ -150,12 +150,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.3124825], dtype=float32),
+ 'x': array([0.31285536], dtype=float32),
'xaxis': 'x',
'y': array(['Chronos Hermes (13B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'Falcon Instruct (7B)',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
'name': 'Falcon Instruct (7B)',
@@ -164,12 +164,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.2895086], dtype=float32),
+ 'x': array([0.30270517], dtype=float32),
'xaxis': 'x',
'y': array(['Falcon Instruct (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'Vicuna v1.5 (7B)',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
'name': 'Vicuna v1.5 (7B)',
@@ -178,12 +178,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.284109], dtype=float32),
+ 'x': array([0.28434175], dtype=float32),
'xaxis': 'x',
'y': array(['Vicuna v1.5 (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'RedPajama-INCITE Chat (7B)',
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
'name': 'RedPajama-INCITE Chat (7B)',
@@ -192,12 +192,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.261367], dtype=float32),
+ 'x': array([0.26832756], dtype=float32),
'xaxis': 'x',
'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'chat-bison (PaLM 2)',
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
'name': 'chat-bison (PaLM 2)',
@@ -206,12 +206,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.23117188], dtype=float32),
+ 'x': array([0.23123139], dtype=float32),
'xaxis': 'x',
'y': array(['chat-bison (PaLM 2)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'gemini-pro',
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
'name': 'gemini-pro',
@@ -220,12 +220,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.23105659], dtype=float32),
+ 'x': array([0.23109974], dtype=float32),
'xaxis': 'x',
'y': array(['gemini-pro'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
'name': 'chat-bison-32k (PaLM 2 32K)',
@@ -234,12 +234,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.23046139], dtype=float32),
+ 'x': array([0.23051436], dtype=float32),
'xaxis': 'x',
'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'llama-2-70b-chat',
'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
'name': 'llama-2-70b-chat',
@@ -248,12 +248,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.20800962], dtype=float32),
+ 'x': array([0.20810011], dtype=float32),
'xaxis': 'x',
'y': array(['llama-2-70b-chat'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
'name': 'Mixtral-8x7B-Instruct-v0.1',
@@ -262,12 +262,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.19128644], dtype=float32),
+ 'x': array([0.19137934], dtype=float32),
'xaxis': 'x',
'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
@@ -276,12 +276,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.12218507], dtype=float32),
+ 'x': array([0.1223323], dtype=float32),
'xaxis': 'x',
'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'zephyr-7b-beta',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
'name': 'zephyr-7b-beta',
@@ -290,12 +290,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.08539014], dtype=float32),
+ 'x': array([0.08554672], dtype=float32),
'xaxis': 'x',
'y': array(['zephyr-7b-beta'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'Mistral-7B-Instruct-v0.2',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
'name': 'Mistral-7B-Instruct-v0.2',
@@ -304,12 +304,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.0438201], dtype=float32),
+ 'x': array([0.04389399], dtype=float32),
'xaxis': 'x',
'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score P=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}',
'legendgroup': 'Upstage SOLAR Instruct v1 (11B)',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
'name': 'Upstage SOLAR Instruct v1 (11B)',
@@ -325,8 +325,8 @@ plot_object,header,plot_json,description,df,arguments
'layout': {'barmode': 'relative',
'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
'template': '...',
- 'title': {'text': 'Summary metrics BERT score P'},
- 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'BERT score P'}},
+ 'title': {'text': 'Summary metrics BERT score precision'},
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'BERT score precision'}},
'yaxis': {'anchor': 'x',
'categoryarray': [Upstage SOLAR Instruct v1 (11B),
Mistral-7B-Instruct-v0.2,
@@ -346,34 +346,34 @@ plot_object,header,plot_json,description,df,arguments
'categoryorder': 'array',
'domain': [0.0, 1.0],
'title': {'text': 'Model'}}}
-})",Summary metrics BERT score P,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4943981],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.48605907],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.42728576],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3647361],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3618188],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34855434],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34085444],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.33974892],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3203912],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.31672964],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3124825],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2895086],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.284109],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.261367],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23117188],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23105659],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23046139],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.20800962],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.19128644],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.122185074],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.085390136],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.043820098],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""BERT score P""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat"",""chat-bison-32k (PaLM 2 32K)"",""gemini-pro"",""chat-bison (PaLM 2)"",""RedPajama-INCITE Chat (7B)"",""Vicuna v1.5 (7B)"",""Falcon Instruct (7B)"",""Chronos Hermes (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""LLaMA-2 Chat (7B)"",""01-ai Yi Chat (34B)"",""WizardLM v1.2 (13B)"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-4"",""gpt-3.5-turbo""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BERT score P""},""barmode"":""relative""}}",,",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score
-18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592
-19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337
-20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464
-4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351
-7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231
-8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172
-14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015
-0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339
-3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306
-10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987
-1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395
-2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395
-13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228
-9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0
-15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363
-17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664
-16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325
-21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284
-6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283
-11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842
-22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574
-5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363
-12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0
-","{""x"": ""bert_score_P"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""bert_score_P"": ""BERT score P"", ""model"": ""Model""}, ""title"": ""Summary metrics BERT score P""}"
+})",Summary metrics BERT score precision,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.49478123],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4864653],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.42933634],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.36488953],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3621834],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34898603],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3420949],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.33981326],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.32074162],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3167385],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.31285536],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.30270517],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.28434175],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.26832756],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23123139],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23109974],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23051436],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.20810011],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.19137934],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.122332305],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.085546724],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.04389399],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""BERT score precision""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat"",""chat-bison-32k (PaLM 2 32K)"",""gemini-pro"",""chat-bison (PaLM 2)"",""RedPajama-INCITE Chat (7B)"",""Vicuna v1.5 (7B)"",""Falcon Instruct (7B)"",""Chronos Hermes (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""LLaMA-2 Chat (7B)"",""01-ai Yi Chat (34B)"",""WizardLM v1.2 (13B)"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-4"",""gpt-3.5-turbo""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BERT score precision""},""barmode"":""relative""}}",,",model,BERT_score_precision,BERT_score_recall,BERT_score_F1,BLEU_score,original_text_length_part,sentence_count,length_penalty
+18,gpt-3.5-turbo,0.49478123,0.50445867,0.49331823,0.00919205486407126,0.5905700146991734,4.229639819909955,89814.0
+19,gpt-4,0.4864653,0.49512562,0.4839312,0.005711113295666468,0.4763731952669352,4.266137566137566,85120.0
+20,gpt-4-turbo,0.42933634,0.4414623,0.4294052,0.0042830628392272,0.5393220459796505,4.266137566137566,85120.0
+4,Mistral (7B) Instruct v0.2 (Together AI),0.36488953,0.3797993,0.36758336,0.005650224193975447,0.5233998570385472,3.712222222222222,29298.0
+7,OpenHermes-2.5-Mistral (7B),0.3621834,0.3685358,0.36003792,0.0068684572027745494,0.312054520357568,3.5818443804034583,14928.0
+8,Qwen 1.5 Chat (7B),0.34898603,0.35945317,0.34867778,0.0033327500620805805,0.29904529709475364,3.5818443804034583,14928.0
+14,WizardLM v1.2 (13B),0.3420949,0.34746957,0.33996373,0.00373442128604677,0.28716720161049375,3.5818443804034583,14928.0
+0,01-ai Yi Chat (34B),0.33981326,0.35219854,0.34183535,0.007428840277380581,0.43251538287409536,3.5818443804034583,14928.0
+3,LLaMA-2 Chat (7B),0.32074162,0.33171847,0.32136682,0.004415024709996126,0.4084233313416049,3.5818443804034583,14928.0
+10,Snorkel Mistral PairRM DPO (7B),0.3167385,0.34785262,0.32718164,0.0029236226777824676,3.7740234383755356,3.5818443804034583,14928.0
+1,Chronos Hermes (13B),0.31285536,0.32630467,0.3150877,0.011542047908319874,0.4742810243835248,3.5818443804034583,14928.0
+2,Falcon Instruct (7B),0.30270517,0.28607234,0.29104736,0.0030232447024239606,0.0490635544441649,3.5818443804034583,14928.0
+13,Vicuna v1.5 (7B),0.28434175,0.29119453,0.2839047,0.007105541953090669,0.2781035051738079,3.6173027989821884,16948.0
+9,RedPajama-INCITE Chat (7B),0.26832756,0.27305293,0.26768887,0.0,0.0560284823193376,3.5818443804034583,14928.0
+15,chat-bison (PaLM 2),0.23123139,0.24001649,0.23214735,0.0037652345768886663,0.2927236655934559,4.281081081081081,83400.0
+17,gemini-pro,0.23109974,0.23956373,0.23199782,0.0032373504004405487,0.295286999418032,4.244871794871795,87700.0
+16,chat-bison-32k (PaLM 2 32K),0.23051436,0.23993237,0.2317056,0.003694633514634998,0.2608806894318779,4.281081081081081,83400.0
+21,llama-2-70b-chat,0.20810011,0.22406381,0.21268094,0.004560500754935232,0.29684572894554634,4.2436893203883495,88008.0
+6,Mixtral-8x7B-Instruct-v0.1,0.19137934,0.2029136,0.19449018,0.0031843990217988536,0.2665288353398184,4.161038961038961,103320.0
+11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122332305,0.12540509,0.12200464,0.003286423403673119,0.13915355617375091,4.244871794871795,87700.0
+22,zephyr-7b-beta,0.085546724,0.08755772,0.085219756,0.0012612839176470308,0.08796697338212889,4.159788702026735,103714.0
+5,Mistral-7B-Instruct-v0.2,0.04389399,0.045185987,0.04378006,0.000566625796313851,0.04250630683894714,4.120342654588421,113258.0
+12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0
+","{""x"": ""BERT_score_precision"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""BERT_score_precision"": ""BERT score precision"", ""model"": ""Model""}, ""title"": ""Summary metrics BERT score precision""}"
"Figure({
'data': [{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'gpt-3.5-turbo',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
'name': 'gpt-3.5-turbo',
@@ -382,12 +382,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.48408476], dtype=float32),
+ 'x': array([0.50445867], dtype=float32),
'xaxis': 'x',
'y': array(['gpt-3.5-turbo'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'gpt-4',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
'name': 'gpt-4',
@@ -396,12 +396,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.472583], dtype=float32),
+ 'x': array([0.49512562], dtype=float32),
'xaxis': 'x',
'y': array(['gpt-4'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'gpt-4-turbo',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
'name': 'gpt-4-turbo',
@@ -410,12 +410,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.4162435], dtype=float32),
+ 'x': array([0.4414623], dtype=float32),
'xaxis': 'x',
'y': array(['gpt-4-turbo'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
@@ -424,12 +424,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.3664233], dtype=float32),
+ 'x': array([0.3797993], dtype=float32),
'xaxis': 'x',
'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
'name': 'OpenHermes-2.5-Mistral (7B)',
@@ -438,12 +438,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.35180506], dtype=float32),
+ 'x': array([0.3685358], dtype=float32),
'xaxis': 'x',
'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'Qwen 1.5 Chat (7B)',
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
'name': 'Qwen 1.5 Chat (7B)',
@@ -452,12 +452,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.34154576], dtype=float32),
+ 'x': array([0.35945317], dtype=float32),
'xaxis': 'x',
'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': '01-ai Yi Chat (34B)',
'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
'name': '01-ai Yi Chat (34B)',
@@ -466,12 +466,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.3404481], dtype=float32),
+ 'x': array([0.35219854], dtype=float32),
'xaxis': 'x',
'y': array(['01-ai Yi Chat (34B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
'name': 'Snorkel Mistral PairRM DPO (7B)',
@@ -480,12 +480,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.33782956], dtype=float32),
+ 'x': array([0.34785262], dtype=float32),
'xaxis': 'x',
'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'WizardLM v1.2 (13B)',
'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
'name': 'WizardLM v1.2 (13B)',
@@ -494,12 +494,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.32933056], dtype=float32),
+ 'x': array([0.34746957], dtype=float32),
'xaxis': 'x',
'y': array(['WizardLM v1.2 (13B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'LLaMA-2 Chat (7B)',
'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
'name': 'LLaMA-2 Chat (7B)',
@@ -508,12 +508,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.3153909], dtype=float32),
+ 'x': array([0.33171847], dtype=float32),
'xaxis': 'x',
'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'Chronos Hermes (13B)',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
'name': 'Chronos Hermes (13B)',
@@ -522,12 +522,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.31071666], dtype=float32),
+ 'x': array([0.32630467], dtype=float32),
'xaxis': 'x',
'y': array(['Chronos Hermes (13B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'Vicuna v1.5 (7B)',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
'name': 'Vicuna v1.5 (7B)',
@@ -536,12 +536,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.27878883], dtype=float32),
+ 'x': array([0.29119453], dtype=float32),
'xaxis': 'x',
'y': array(['Vicuna v1.5 (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'Falcon Instruct (7B)',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
'name': 'Falcon Instruct (7B)',
@@ -550,12 +550,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.23968808], dtype=float32),
+ 'x': array([0.28607234], dtype=float32),
'xaxis': 'x',
'y': array(['Falcon Instruct (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'RedPajama-INCITE Chat (7B)',
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
'name': 'RedPajama-INCITE Chat (7B)',
@@ -564,54 +564,54 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.23758642], dtype=float32),
+ 'x': array([0.27305293], dtype=float32),
'xaxis': 'x',
'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
- 'legendgroup': 'gemini-pro',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
+ 'legendgroup': 'chat-bison (PaLM 2)',
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
- 'name': 'gemini-pro',
- 'offsetgroup': 'gemini-pro',
+ 'name': 'chat-bison (PaLM 2)',
+ 'offsetgroup': 'chat-bison (PaLM 2)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.23057175], dtype=float32),
+ 'x': array([0.24001649], dtype=float32),
'xaxis': 'x',
- 'y': array(['gemini-pro'], dtype=object),
+ 'y': array(['chat-bison (PaLM 2)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
- 'legendgroup': 'chat-bison (PaLM 2)',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
- 'name': 'chat-bison (PaLM 2)',
- 'offsetgroup': 'chat-bison (PaLM 2)',
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.23029378], dtype=float32),
+ 'x': array([0.23993237], dtype=float32),
'xaxis': 'x',
- 'y': array(['chat-bison (PaLM 2)'], dtype=object),
+ 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
- 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
+ 'legendgroup': 'gemini-pro',
'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
- 'name': 'chat-bison-32k (PaLM 2 32K)',
- 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'name': 'gemini-pro',
+ 'offsetgroup': 'gemini-pro',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.22983725], dtype=float32),
+ 'x': array([0.23956373], dtype=float32),
'xaxis': 'x',
- 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
+ 'y': array(['gemini-pro'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'llama-2-70b-chat',
'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
'name': 'llama-2-70b-chat',
@@ -620,12 +620,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.21472095], dtype=float32),
+ 'x': array([0.22406381], dtype=float32),
'xaxis': 'x',
'y': array(['llama-2-70b-chat'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
'name': 'Mixtral-8x7B-Instruct-v0.1',
@@ -634,12 +634,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.19555509], dtype=float32),
+ 'x': array([0.2029136], dtype=float32),
'xaxis': 'x',
'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
@@ -648,12 +648,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.11885959], dtype=float32),
+ 'x': array([0.12540509], dtype=float32),
'xaxis': 'x',
'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'zephyr-7b-beta',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
'name': 'zephyr-7b-beta',
@@ -662,12 +662,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.08266569], dtype=float32),
+ 'x': array([0.08755772], dtype=float32),
'xaxis': 'x',
'y': array(['zephyr-7b-beta'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'Mistral-7B-Instruct-v0.2',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
'name': 'Mistral-7B-Instruct-v0.2',
@@ -676,12 +676,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.04256168], dtype=float32),
+ 'x': array([0.04518599], dtype=float32),
'xaxis': 'x',
'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BERT score R=%{x}',
+ 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}',
'legendgroup': 'Upstage SOLAR Instruct v1 (11B)',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
'name': 'Upstage SOLAR Instruct v1 (11B)',
@@ -697,17 +697,17 @@ plot_object,header,plot_json,description,df,arguments
'layout': {'barmode': 'relative',
'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
'template': '...',
- 'title': {'text': 'Summary metrics BERT score R'},
- 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'BERT score R'}},
+ 'title': {'text': 'Summary metrics BERT score recall'},
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'BERT score recall'}},
'yaxis': {'anchor': 'x',
'categoryarray': [Upstage SOLAR Instruct v1 (11B),
Mistral-7B-Instruct-v0.2,
zephyr-7b-beta,
TinyLlama/TinyLlama-1.1B-Chat-v1.0,
Mixtral-8x7B-Instruct-v0.1,
- llama-2-70b-chat, chat-bison-32k (PaLM 2
- 32K), chat-bison (PaLM 2), gemini-pro,
- RedPajama-INCITE Chat (7B), Falcon
+ llama-2-70b-chat, gemini-pro, chat-
+ bison-32k (PaLM 2 32K), chat-bison (PaLM
+ 2), RedPajama-INCITE Chat (7B), Falcon
Instruct (7B), Vicuna v1.5 (7B), Chronos
Hermes (13B), LLaMA-2 Chat (7B),
WizardLM v1.2 (13B), Snorkel Mistral
@@ -719,31 +719,31 @@ plot_object,header,plot_json,description,df,arguments
'categoryorder': 'array',
'domain': [0.0, 1.0],
'title': {'text': 'Model'}}}
-})",Summary metrics BERT score R,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.48408476],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.472583],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4162435],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3664233],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.35180506],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34154576],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3404481],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.33782956],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.32933056],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3153909],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.31071666],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.27878883],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23968808],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23758642],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23057175],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23029378],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.22983725],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.21472095],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.19555509],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.11885959],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.08266569],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.042561684],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""BERT score R""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)"",""gemini-pro"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Chronos Hermes (13B)"",""LLaMA-2 Chat (7B)"",""WizardLM v1.2 (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""01-ai Yi Chat (34B)"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-4"",""gpt-3.5-turbo""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BERT score R""},""barmode"":""relative""}}",,",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score
-18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592
-19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337
-20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464
-4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351
-7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231
-8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172
-0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339
-10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987
-14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015
-3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306
-1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395
-13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228
-2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395
-9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0
-17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664
-15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363
-16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325
-21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284
-6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283
-11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842
-22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574
-5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363
-12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0
-","{""x"": ""bert_score_R"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""bert_score_R"": ""BERT score R"", ""model"": ""Model""}, ""title"": ""Summary metrics BERT score R""}"
+})",Summary metrics BERT score recall,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.50445867],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.49512562],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4414623],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3797993],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3685358],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.35945317],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.35219854],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34785262],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34746957],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.33171847],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.32630467],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.29119453],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.28607234],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.27305293],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.24001649],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23993237],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23956373],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.22406381],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2029136],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.12540509],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.08755772],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.045185987],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""BERT score recall""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat"",""gemini-pro"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Chronos Hermes (13B)"",""LLaMA-2 Chat (7B)"",""WizardLM v1.2 (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""01-ai Yi Chat (34B)"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-4"",""gpt-3.5-turbo""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BERT score recall""},""barmode"":""relative""}}",,",model,BERT_score_precision,BERT_score_recall,BERT_score_F1,BLEU_score,original_text_length_part,sentence_count,length_penalty
+18,gpt-3.5-turbo,0.49478123,0.50445867,0.49331823,0.00919205486407126,0.5905700146991734,4.229639819909955,89814.0
+19,gpt-4,0.4864653,0.49512562,0.4839312,0.005711113295666468,0.4763731952669352,4.266137566137566,85120.0
+20,gpt-4-turbo,0.42933634,0.4414623,0.4294052,0.0042830628392272,0.5393220459796505,4.266137566137566,85120.0
+4,Mistral (7B) Instruct v0.2 (Together AI),0.36488953,0.3797993,0.36758336,0.005650224193975447,0.5233998570385472,3.712222222222222,29298.0
+7,OpenHermes-2.5-Mistral (7B),0.3621834,0.3685358,0.36003792,0.0068684572027745494,0.312054520357568,3.5818443804034583,14928.0
+8,Qwen 1.5 Chat (7B),0.34898603,0.35945317,0.34867778,0.0033327500620805805,0.29904529709475364,3.5818443804034583,14928.0
+0,01-ai Yi Chat (34B),0.33981326,0.35219854,0.34183535,0.007428840277380581,0.43251538287409536,3.5818443804034583,14928.0
+10,Snorkel Mistral PairRM DPO (7B),0.3167385,0.34785262,0.32718164,0.0029236226777824676,3.7740234383755356,3.5818443804034583,14928.0
+14,WizardLM v1.2 (13B),0.3420949,0.34746957,0.33996373,0.00373442128604677,0.28716720161049375,3.5818443804034583,14928.0
+3,LLaMA-2 Chat (7B),0.32074162,0.33171847,0.32136682,0.004415024709996126,0.4084233313416049,3.5818443804034583,14928.0
+1,Chronos Hermes (13B),0.31285536,0.32630467,0.3150877,0.011542047908319874,0.4742810243835248,3.5818443804034583,14928.0
+13,Vicuna v1.5 (7B),0.28434175,0.29119453,0.2839047,0.007105541953090669,0.2781035051738079,3.6173027989821884,16948.0
+2,Falcon Instruct (7B),0.30270517,0.28607234,0.29104736,0.0030232447024239606,0.0490635544441649,3.5818443804034583,14928.0
+9,RedPajama-INCITE Chat (7B),0.26832756,0.27305293,0.26768887,0.0,0.0560284823193376,3.5818443804034583,14928.0
+15,chat-bison (PaLM 2),0.23123139,0.24001649,0.23214735,0.0037652345768886663,0.2927236655934559,4.281081081081081,83400.0
+16,chat-bison-32k (PaLM 2 32K),0.23051436,0.23993237,0.2317056,0.003694633514634998,0.2608806894318779,4.281081081081081,83400.0
+17,gemini-pro,0.23109974,0.23956373,0.23199782,0.0032373504004405487,0.295286999418032,4.244871794871795,87700.0
+21,llama-2-70b-chat,0.20810011,0.22406381,0.21268094,0.004560500754935232,0.29684572894554634,4.2436893203883495,88008.0
+6,Mixtral-8x7B-Instruct-v0.1,0.19137934,0.2029136,0.19449018,0.0031843990217988536,0.2665288353398184,4.161038961038961,103320.0
+11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122332305,0.12540509,0.12200464,0.003286423403673119,0.13915355617375091,4.244871794871795,87700.0
+22,zephyr-7b-beta,0.085546724,0.08755772,0.085219756,0.0012612839176470308,0.08796697338212889,4.159788702026735,103714.0
+5,Mistral-7B-Instruct-v0.2,0.04389399,0.045185987,0.04378006,0.000566625796313851,0.04250630683894714,4.120342654588421,113258.0
+12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0
+","{""x"": ""BERT_score_recall"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""BERT_score_recall"": ""BERT score recall"", ""model"": ""Model""}, ""title"": ""Summary metrics BERT score recall""}"
"Figure({
'data': [{'alignmentgroup': 'True',
'hovertemplate': 'Model=%{y}
BERT score F1=%{x}',
@@ -755,7 +755,7 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.4888874], dtype=float32),
+ 'x': array([0.49331823], dtype=float32),
'xaxis': 'x',
'y': array(['gpt-3.5-turbo'], dtype=object),
'yaxis': 'y'},
@@ -769,7 +769,7 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.47901583], dtype=float32),
+ 'x': array([0.4839312], dtype=float32),
'xaxis': 'x',
'y': array(['gpt-4'], dtype=object),
'yaxis': 'y'},
@@ -783,7 +783,7 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.42098433], dtype=float32),
+ 'x': array([0.4294052], dtype=float32),
'xaxis': 'x',
'y': array(['gpt-4-turbo'], dtype=object),
'yaxis': 'y'},
@@ -797,7 +797,7 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.36540908], dtype=float32),
+ 'x': array([0.36758336], dtype=float32),
'xaxis': 'x',
'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
'yaxis': 'y'},
@@ -811,7 +811,7 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.3565194], dtype=float32),
+ 'x': array([0.36003792], dtype=float32),
'xaxis': 'x',
'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
'yaxis': 'y'},
@@ -825,7 +825,7 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.344803], dtype=float32),
+ 'x': array([0.34867778], dtype=float32),
'xaxis': 'x',
'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
'yaxis': 'y'},
@@ -839,7 +839,7 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.3399749], dtype=float32),
+ 'x': array([0.34183535], dtype=float32),
'xaxis': 'x',
'y': array(['01-ai Yi Chat (34B)'], dtype=object),
'yaxis': 'y'},
@@ -853,7 +853,7 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.33466902], dtype=float32),
+ 'x': array([0.33996373], dtype=float32),
'xaxis': 'x',
'y': array(['WizardLM v1.2 (13B)'], dtype=object),
'yaxis': 'y'},
@@ -867,7 +867,7 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.3265383], dtype=float32),
+ 'x': array([0.32718164], dtype=float32),
'xaxis': 'x',
'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
'yaxis': 'y'},
@@ -881,7 +881,7 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.31770444], dtype=float32),
+ 'x': array([0.32136682], dtype=float32),
'xaxis': 'x',
'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
'yaxis': 'y'},
@@ -895,37 +895,37 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.311415], dtype=float32),
+ 'x': array([0.3150877], dtype=float32),
'xaxis': 'x',
'y': array(['Chronos Hermes (13B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
'hovertemplate': 'Model=%{y}
BERT score F1=%{x}',
- 'legendgroup': 'Vicuna v1.5 (7B)',
+ 'legendgroup': 'Falcon Instruct (7B)',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
- 'name': 'Vicuna v1.5 (7B)',
- 'offsetgroup': 'Vicuna v1.5 (7B)',
+ 'name': 'Falcon Instruct (7B)',
+ 'offsetgroup': 'Falcon Instruct (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.28129113], dtype=float32),
+ 'x': array([0.29104736], dtype=float32),
'xaxis': 'x',
- 'y': array(['Vicuna v1.5 (7B)'], dtype=object),
+ 'y': array(['Falcon Instruct (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
'hovertemplate': 'Model=%{y}
BERT score F1=%{x}',
- 'legendgroup': 'Falcon Instruct (7B)',
+ 'legendgroup': 'Vicuna v1.5 (7B)',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
- 'name': 'Falcon Instruct (7B)',
- 'offsetgroup': 'Falcon Instruct (7B)',
+ 'name': 'Vicuna v1.5 (7B)',
+ 'offsetgroup': 'Vicuna v1.5 (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.2615204], dtype=float32),
+ 'x': array([0.2839047], dtype=float32),
'xaxis': 'x',
- 'y': array(['Falcon Instruct (7B)'], dtype=object),
+ 'y': array(['Vicuna v1.5 (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
'hovertemplate': 'Model=%{y}
BERT score F1=%{x}',
@@ -937,37 +937,37 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.2487217], dtype=float32),
+ 'x': array([0.26768887], dtype=float32),
'xaxis': 'x',
'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
'hovertemplate': 'Model=%{y}
BERT score F1=%{x}',
- 'legendgroup': 'gemini-pro',
+ 'legendgroup': 'chat-bison (PaLM 2)',
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
- 'name': 'gemini-pro',
- 'offsetgroup': 'gemini-pro',
+ 'name': 'chat-bison (PaLM 2)',
+ 'offsetgroup': 'chat-bison (PaLM 2)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.23072062], dtype=float32),
+ 'x': array([0.23214735], dtype=float32),
'xaxis': 'x',
- 'y': array(['gemini-pro'], dtype=object),
+ 'y': array(['chat-bison (PaLM 2)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
'hovertemplate': 'Model=%{y}
BERT score F1=%{x}',
- 'legendgroup': 'chat-bison (PaLM 2)',
+ 'legendgroup': 'gemini-pro',
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
- 'name': 'chat-bison (PaLM 2)',
- 'offsetgroup': 'chat-bison (PaLM 2)',
+ 'name': 'gemini-pro',
+ 'offsetgroup': 'gemini-pro',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.23060663], dtype=float32),
+ 'x': array([0.23199782], dtype=float32),
'xaxis': 'x',
- 'y': array(['chat-bison (PaLM 2)'], dtype=object),
+ 'y': array(['gemini-pro'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
'hovertemplate': 'Model=%{y}
BERT score F1=%{x}',
@@ -979,7 +979,7 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.23002876], dtype=float32),
+ 'x': array([0.2317056], dtype=float32),
'xaxis': 'x',
'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
'yaxis': 'y'},
@@ -993,7 +993,7 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.21117964], dtype=float32),
+ 'x': array([0.21268094], dtype=float32),
'xaxis': 'x',
'y': array(['llama-2-70b-chat'], dtype=object),
'yaxis': 'y'},
@@ -1007,7 +1007,7 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.19330867], dtype=float32),
+ 'x': array([0.19449018], dtype=float32),
'xaxis': 'x',
'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
'yaxis': 'y'},
@@ -1021,7 +1021,7 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.12042627], dtype=float32),
+ 'x': array([0.12200464], dtype=float32),
'xaxis': 'x',
'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
'yaxis': 'y'},
@@ -1035,7 +1035,7 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.08394519], dtype=float32),
+ 'x': array([0.08521976], dtype=float32),
'xaxis': 'x',
'y': array(['zephyr-7b-beta'], dtype=object),
'yaxis': 'y'},
@@ -1049,7 +1049,7 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.04313921], dtype=float32),
+ 'x': array([0.04378006], dtype=float32),
'xaxis': 'x',
'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
'yaxis': 'y'},
@@ -1079,9 +1079,9 @@ plot_object,header,plot_json,description,df,arguments
TinyLlama/TinyLlama-1.1B-Chat-v1.0,
Mixtral-8x7B-Instruct-v0.1,
llama-2-70b-chat, chat-bison-32k (PaLM 2
- 32K), chat-bison (PaLM 2), gemini-pro,
- RedPajama-INCITE Chat (7B), Falcon
- Instruct (7B), Vicuna v1.5 (7B), Chronos
+ 32K), gemini-pro, chat-bison (PaLM 2),
+ RedPajama-INCITE Chat (7B), Vicuna v1.5
+ (7B), Falcon Instruct (7B), Chronos
Hermes (13B), LLaMA-2 Chat (7B), Snorkel
Mistral PairRM DPO (7B), WizardLM v1.2
(13B), 01-ai Yi Chat (34B), Qwen 1.5
@@ -1091,48 +1091,54 @@ plot_object,header,plot_json,description,df,arguments
'categoryorder': 'array',
'domain': [0.0, 1.0],
'title': {'text': 'Model'}}}
-})",Summary metrics BERT score F1,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4888874],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.47901583],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.42098433],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.36540908],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3565194],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.344803],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3399749],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.33466902],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3265383],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.31770444],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.311415],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.28129113],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2615204],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2487217],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23072062],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23060663],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23002876],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.21117964],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.19330867],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.12042627],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.08394519],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.04313921],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""BERT score F1""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)"",""gemini-pro"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Chronos Hermes (13B)"",""LLaMA-2 Chat (7B)"",""Snorkel Mistral PairRM DPO (7B)"",""WizardLM v1.2 (13B)"",""01-ai Yi Chat (34B)"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-4"",""gpt-3.5-turbo""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BERT score F1""},""barmode"":""relative""}}",How similar are the BERT model embeddings of the summary to the BERT model embeddings of the original text. Value is averaged for each model.,",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score
-18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592
-19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337
-20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464
-4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351
-7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231
-8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172
-0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339
-14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015
-10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987
-3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306
-1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395
-13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228
-2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395
-9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0
-17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664
-15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363
-16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325
-21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284
-6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283
-11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842
-22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574
-5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363
-12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0
-","{""x"": ""bert_score_F1"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""bert_score_F1"": ""BERT score F1"", ""model"": ""Model""}, ""title"": ""Summary metrics BERT score F1""}"
+})",Summary metrics BERT score F1,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.49331823],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4839312],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4294052],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.36758336],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.36003792],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34867778],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34183535],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.33996373],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.32718164],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.32136682],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3150877],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.29104736],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2839047],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.26768887],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23214735],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23199782],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2317056],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.21268094],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.19449018],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.12200464],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.085219756],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.04378006],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""BERT score F1""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat"",""chat-bison-32k (PaLM 2 32K)"",""gemini-pro"",""chat-bison (PaLM 2)"",""RedPajama-INCITE Chat (7B)"",""Vicuna v1.5 (7B)"",""Falcon Instruct (7B)"",""Chronos Hermes (13B)"",""LLaMA-2 Chat (7B)"",""Snorkel Mistral PairRM DPO (7B)"",""WizardLM v1.2 (13B)"",""01-ai Yi Chat (34B)"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-4"",""gpt-3.5-turbo""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BERT score F1""},""barmode"":""relative""}}","
+ BERT score uses contextual embeddings from pre-trained BERT model to compare summarized text to reference texts.
+ For reference texts we used reference summarizations from the dataset, article title and original article text.
+ BERT score measures the similarity at both the token and sentence levels, capturing semantic nuances and contextual relevance.
+
+ More about this metric can be read here: [link](https://arxiv.org/pdf/1904.09675.pdf).
+ Higher score indicates better alignment between the generated and reference text. The value is averaged for each model.",",model,BERT_score_precision,BERT_score_recall,BERT_score_F1,BLEU_score,original_text_length_part,sentence_count,length_penalty
+18,gpt-3.5-turbo,0.49478123,0.50445867,0.49331823,0.00919205486407126,0.5905700146991734,4.229639819909955,89814.0
+19,gpt-4,0.4864653,0.49512562,0.4839312,0.005711113295666468,0.4763731952669352,4.266137566137566,85120.0
+20,gpt-4-turbo,0.42933634,0.4414623,0.4294052,0.0042830628392272,0.5393220459796505,4.266137566137566,85120.0
+4,Mistral (7B) Instruct v0.2 (Together AI),0.36488953,0.3797993,0.36758336,0.005650224193975447,0.5233998570385472,3.712222222222222,29298.0
+7,OpenHermes-2.5-Mistral (7B),0.3621834,0.3685358,0.36003792,0.0068684572027745494,0.312054520357568,3.5818443804034583,14928.0
+8,Qwen 1.5 Chat (7B),0.34898603,0.35945317,0.34867778,0.0033327500620805805,0.29904529709475364,3.5818443804034583,14928.0
+0,01-ai Yi Chat (34B),0.33981326,0.35219854,0.34183535,0.007428840277380581,0.43251538287409536,3.5818443804034583,14928.0
+14,WizardLM v1.2 (13B),0.3420949,0.34746957,0.33996373,0.00373442128604677,0.28716720161049375,3.5818443804034583,14928.0
+10,Snorkel Mistral PairRM DPO (7B),0.3167385,0.34785262,0.32718164,0.0029236226777824676,3.7740234383755356,3.5818443804034583,14928.0
+3,LLaMA-2 Chat (7B),0.32074162,0.33171847,0.32136682,0.004415024709996126,0.4084233313416049,3.5818443804034583,14928.0
+1,Chronos Hermes (13B),0.31285536,0.32630467,0.3150877,0.011542047908319874,0.4742810243835248,3.5818443804034583,14928.0
+2,Falcon Instruct (7B),0.30270517,0.28607234,0.29104736,0.0030232447024239606,0.0490635544441649,3.5818443804034583,14928.0
+13,Vicuna v1.5 (7B),0.28434175,0.29119453,0.2839047,0.007105541953090669,0.2781035051738079,3.6173027989821884,16948.0
+9,RedPajama-INCITE Chat (7B),0.26832756,0.27305293,0.26768887,0.0,0.0560284823193376,3.5818443804034583,14928.0
+15,chat-bison (PaLM 2),0.23123139,0.24001649,0.23214735,0.0037652345768886663,0.2927236655934559,4.281081081081081,83400.0
+17,gemini-pro,0.23109974,0.23956373,0.23199782,0.0032373504004405487,0.295286999418032,4.244871794871795,87700.0
+16,chat-bison-32k (PaLM 2 32K),0.23051436,0.23993237,0.2317056,0.003694633514634998,0.2608806894318779,4.281081081081081,83400.0
+21,llama-2-70b-chat,0.20810011,0.22406381,0.21268094,0.004560500754935232,0.29684572894554634,4.2436893203883495,88008.0
+6,Mixtral-8x7B-Instruct-v0.1,0.19137934,0.2029136,0.19449018,0.0031843990217988536,0.2665288353398184,4.161038961038961,103320.0
+11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122332305,0.12540509,0.12200464,0.003286423403673119,0.13915355617375091,4.244871794871795,87700.0
+22,zephyr-7b-beta,0.085546724,0.08755772,0.085219756,0.0012612839176470308,0.08796697338212889,4.159788702026735,103714.0
+5,Mistral-7B-Instruct-v0.2,0.04389399,0.045185987,0.04378006,0.000566625796313851,0.04250630683894714,4.120342654588421,113258.0
+12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0
+","{""x"": ""BERT_score_F1"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""BERT_score_F1"": ""BERT score F1"", ""model"": ""Model""}, ""title"": ""Summary metrics BERT score F1""}"
"Figure({
'data': [{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'Chronos Hermes (13B)',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
- 'name': 'Snorkel Mistral PairRM DPO (7B)',
- 'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'name': 'Chronos Hermes (13B)',
+ 'offsetgroup': 'Chronos Hermes (13B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([3.77402344]),
+ 'x': array([0.01154205]),
'xaxis': 'x',
- 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
+ 'y': array(['Chronos Hermes (13B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
'legendgroup': 'gpt-3.5-turbo',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
'name': 'gpt-3.5-turbo',
@@ -1141,292 +1147,292 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.59057001]),
+ 'x': array([0.00919205]),
'xaxis': 'x',
'y': array(['gpt-3.5-turbo'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'gpt-4-turbo',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': '01-ai Yi Chat (34B)',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
- 'name': 'gpt-4-turbo',
- 'offsetgroup': 'gpt-4-turbo',
+ 'name': '01-ai Yi Chat (34B)',
+ 'offsetgroup': '01-ai Yi Chat (34B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.53932205]),
+ 'x': array([0.00742884]),
'xaxis': 'x',
- 'y': array(['gpt-4-turbo'], dtype=object),
+ 'y': array(['01-ai Yi Chat (34B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'Vicuna v1.5 (7B)',
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
- 'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
- 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'name': 'Vicuna v1.5 (7B)',
+ 'offsetgroup': 'Vicuna v1.5 (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.52339986]),
+ 'x': array([0.00710554]),
'xaxis': 'x',
- 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
+ 'y': array(['Vicuna v1.5 (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'gpt-4',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
- 'name': 'gpt-4',
- 'offsetgroup': 'gpt-4',
+ 'name': 'OpenHermes-2.5-Mistral (7B)',
+ 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.4763732]),
+ 'x': array([0.00686846]),
'xaxis': 'x',
- 'y': array(['gpt-4'], dtype=object),
+ 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'Chronos Hermes (13B)',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'gpt-4',
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
- 'name': 'Chronos Hermes (13B)',
- 'offsetgroup': 'Chronos Hermes (13B)',
+ 'name': 'gpt-4',
+ 'offsetgroup': 'gpt-4',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.47428102]),
+ 'x': array([0.00571111]),
'xaxis': 'x',
- 'y': array(['Chronos Hermes (13B)'], dtype=object),
+ 'y': array(['gpt-4'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': '01-ai Yi Chat (34B)',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
- 'name': '01-ai Yi Chat (34B)',
- 'offsetgroup': '01-ai Yi Chat (34B)',
+ 'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.43251538]),
+ 'x': array([0.00565022]),
'xaxis': 'x',
- 'y': array(['01-ai Yi Chat (34B)'], dtype=object),
+ 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'LLaMA-2 Chat (7B)',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'llama-2-70b-chat',
'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
- 'name': 'LLaMA-2 Chat (7B)',
- 'offsetgroup': 'LLaMA-2 Chat (7B)',
+ 'name': 'llama-2-70b-chat',
+ 'offsetgroup': 'llama-2-70b-chat',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.40842333]),
+ 'x': array([0.0045605]),
'xaxis': 'x',
- 'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
+ 'y': array(['llama-2-70b-chat'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'LLaMA-2 Chat (7B)',
'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
- 'name': 'OpenHermes-2.5-Mistral (7B)',
- 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'name': 'LLaMA-2 Chat (7B)',
+ 'offsetgroup': 'LLaMA-2 Chat (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.31205452]),
+ 'x': array([0.00441502]),
'xaxis': 'x',
- 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
+ 'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'Qwen 1.5 Chat (7B)',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'gpt-4-turbo',
'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
- 'name': 'Qwen 1.5 Chat (7B)',
- 'offsetgroup': 'Qwen 1.5 Chat (7B)',
+ 'name': 'gpt-4-turbo',
+ 'offsetgroup': 'gpt-4-turbo',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.2990453]),
+ 'x': array([0.00428306]),
'xaxis': 'x',
- 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
+ 'y': array(['gpt-4-turbo'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'llama-2-70b-chat',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'chat-bison (PaLM 2)',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
- 'name': 'llama-2-70b-chat',
- 'offsetgroup': 'llama-2-70b-chat',
+ 'name': 'chat-bison (PaLM 2)',
+ 'offsetgroup': 'chat-bison (PaLM 2)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.29684573]),
+ 'x': array([0.00376523]),
'xaxis': 'x',
- 'y': array(['llama-2-70b-chat'], dtype=object),
+ 'y': array(['chat-bison (PaLM 2)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'gemini-pro',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'WizardLM v1.2 (13B)',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
- 'name': 'gemini-pro',
- 'offsetgroup': 'gemini-pro',
+ 'name': 'WizardLM v1.2 (13B)',
+ 'offsetgroup': 'WizardLM v1.2 (13B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.295287]),
+ 'x': array([0.00373442]),
'xaxis': 'x',
- 'y': array(['gemini-pro'], dtype=object),
+ 'y': array(['WizardLM v1.2 (13B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'chat-bison (PaLM 2)',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
- 'name': 'chat-bison (PaLM 2)',
- 'offsetgroup': 'chat-bison (PaLM 2)',
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.29272367]),
+ 'x': array([0.00369463]),
'xaxis': 'x',
- 'y': array(['chat-bison (PaLM 2)'], dtype=object),
+ 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'WizardLM v1.2 (13B)',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'Qwen 1.5 Chat (7B)',
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
- 'name': 'WizardLM v1.2 (13B)',
- 'offsetgroup': 'WizardLM v1.2 (13B)',
+ 'name': 'Qwen 1.5 Chat (7B)',
+ 'offsetgroup': 'Qwen 1.5 Chat (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.2871672]),
+ 'x': array([0.00333275]),
'xaxis': 'x',
- 'y': array(['WizardLM v1.2 (13B)'], dtype=object),
+ 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'Vicuna v1.5 (7B)',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
- 'name': 'Vicuna v1.5 (7B)',
- 'offsetgroup': 'Vicuna v1.5 (7B)',
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.27810351]),
+ 'x': array([0.00328642]),
'xaxis': 'x',
- 'y': array(['Vicuna v1.5 (7B)'], dtype=object),
+ 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'gemini-pro',
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
- 'name': 'Mixtral-8x7B-Instruct-v0.1',
- 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'name': 'gemini-pro',
+ 'offsetgroup': 'gemini-pro',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.26652884]),
+ 'x': array([0.00323735]),
'xaxis': 'x',
- 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
+ 'y': array(['gemini-pro'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
- 'name': 'chat-bison-32k (PaLM 2 32K)',
- 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.26088069]),
+ 'x': array([0.0031844]),
'xaxis': 'x',
- 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
+ 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'Falcon Instruct (7B)',
'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
- 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
- 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'name': 'Falcon Instruct (7B)',
+ 'offsetgroup': 'Falcon Instruct (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.13915356]),
+ 'x': array([0.00302324]),
'xaxis': 'x',
- 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
+ 'y': array(['Falcon Instruct (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'zephyr-7b-beta',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
- 'name': 'zephyr-7b-beta',
- 'offsetgroup': 'zephyr-7b-beta',
+ 'name': 'Snorkel Mistral PairRM DPO (7B)',
+ 'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.08796697]),
+ 'x': array([0.00292362]),
'xaxis': 'x',
- 'y': array(['zephyr-7b-beta'], dtype=object),
+ 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'RedPajama-INCITE Chat (7B)',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'zephyr-7b-beta',
'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
- 'name': 'RedPajama-INCITE Chat (7B)',
- 'offsetgroup': 'RedPajama-INCITE Chat (7B)',
+ 'name': 'zephyr-7b-beta',
+ 'offsetgroup': 'zephyr-7b-beta',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.05602848]),
+ 'x': array([0.00126128]),
'xaxis': 'x',
- 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
+ 'y': array(['zephyr-7b-beta'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'Falcon Instruct (7B)',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
- 'name': 'Falcon Instruct (7B)',
- 'offsetgroup': 'Falcon Instruct (7B)',
+ 'name': 'Mistral-7B-Instruct-v0.2',
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.04906355]),
+ 'x': array([0.00056663]),
'xaxis': 'x',
- 'y': array(['Falcon Instruct (7B)'], dtype=object),
+ 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
- 'legendgroup': 'Mistral-7B-Instruct-v0.2',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'legendgroup': 'RedPajama-INCITE Chat (7B)',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
- 'name': 'Mistral-7B-Instruct-v0.2',
- 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
+ 'name': 'RedPajama-INCITE Chat (7B)',
+ 'offsetgroup': 'RedPajama-INCITE Chat (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.04250631]),
+ 'x': array([0.]),
'xaxis': 'x',
- 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
+ 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
'legendgroup': 'Upstage SOLAR Instruct v1 (11B)',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
'name': 'Upstage SOLAR Instruct v1 (11B)',
@@ -1435,91 +1441,98 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00176623]),
+ 'x': array([0.]),
'xaxis': 'x',
'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object),
'yaxis': 'y'}],
'layout': {'barmode': 'relative',
'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
'template': '...',
- 'title': {'text': 'Summary metrics original text length part'},
- 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'original text length part'}},
+ 'title': {'text': 'Summary metrics BLEU score'},
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'BLEU score'}},
'yaxis': {'anchor': 'x',
'categoryarray': [Upstage SOLAR Instruct v1 (11B),
- Mistral-7B-Instruct-v0.2, Falcon
- Instruct (7B), RedPajama-INCITE Chat
- (7B), zephyr-7b-beta,
- TinyLlama/TinyLlama-1.1B-Chat-v1.0,
- chat-bison-32k (PaLM 2 32K),
- Mixtral-8x7B-Instruct-v0.1, Vicuna v1.5
- (7B), WizardLM v1.2 (13B), chat-bison
- (PaLM 2), gemini-pro, llama-2-70b-chat,
- Qwen 1.5 Chat (7B),
- OpenHermes-2.5-Mistral (7B), LLaMA-2
- Chat (7B), 01-ai Yi Chat (34B), Chronos
- Hermes (13B), gpt-4, Mistral (7B)
- Instruct v0.2 (Together AI),
- gpt-4-turbo, gpt-3.5-turbo, Snorkel
- Mistral PairRM DPO (7B)],
+ RedPajama-INCITE Chat (7B),
+ Mistral-7B-Instruct-v0.2,
+ zephyr-7b-beta, Snorkel Mistral PairRM
+ DPO (7B), Falcon Instruct (7B),
+ Mixtral-8x7B-Instruct-v0.1, gemini-pro,
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0, Qwen
+ 1.5 Chat (7B), chat-bison-32k (PaLM 2
+ 32K), WizardLM v1.2 (13B), chat-bison
+ (PaLM 2), gpt-4-turbo, LLaMA-2 Chat
+ (7B), llama-2-70b-chat, Mistral (7B)
+ Instruct v0.2 (Together AI), gpt-4,
+ OpenHermes-2.5-Mistral (7B), Vicuna v1.5
+ (7B), 01-ai Yi Chat (34B),
+ gpt-3.5-turbo, Chronos Hermes (13B)],
'categoryorder': 'array',
'domain': [0.0, 1.0],
'title': {'text': 'Model'}}}
-})",Summary metrics original text length part,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.7740234383755356],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.5905700146991734],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.5393220459796505],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.5233998570385472],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4763731952669352],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4742810243835248],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.43251538287409536],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4084233313416049],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.312054520357568],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.29904529709475364],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.29684572894554634],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.295286999418032],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2927236655934559],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.28716720161049375],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2781035051738079],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2665288353398184],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2608806894318779],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.13915355617375091],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.08796697338212889],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0560284823193376],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0490635544441649],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.04250630683894714],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0017662349842492329],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""original text length part""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""Falcon Instruct (7B)"",""RedPajama-INCITE Chat (7B)"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison-32k (PaLM 2 32K)"",""Mixtral-8x7B-Instruct-v0.1"",""Vicuna v1.5 (7B)"",""WizardLM v1.2 (13B)"",""chat-bison (PaLM 2)"",""gemini-pro"",""llama-2-70b-chat"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""LLaMA-2 Chat (7B)"",""01-ai Yi Chat (34B)"",""Chronos Hermes (13B)"",""gpt-4"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-3.5-turbo"",""Snorkel Mistral PairRM DPO (7B)""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics original text length part""},""barmode"":""relative""}}","How long is the summarization compared to the original text, calculated as: `len(summarized_text) + 1 / len(original_text) + 1`. Value is averaged for each model.",",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score
-10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987
-18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592
-20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464
-4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351
-19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337
-1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395
-0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339
-3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306
-7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231
-8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172
-21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284
-17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664
-15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363
-14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015
-13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228
-6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283
-16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325
-11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842
-22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574
-9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0
-2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395
-5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363
-12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0
-","{""x"": ""original_text_length_part"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""original_text_length_part"": ""original text length part"", ""model"": ""Model""}, ""title"": ""Summary metrics original text length part""}"
+})",Summary metrics BLEU score,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.011542047908319874],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.00919205486407126],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.007428840277380581],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.007105541953090669],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0068684572027745494],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.005711113295666468],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.005650224193975447],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.004560500754935232],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.004415024709996126],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0042830628392272],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0037652345768886663],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.00373442128604677],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.003694633514634998],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0033327500620805805],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.003286423403673119],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0032373504004405487],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0031843990217988536],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0030232447024239606],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0029236226777824676],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0012612839176470308],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.000566625796313851],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""BLEU score""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""RedPajama-INCITE Chat (7B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""Snorkel Mistral PairRM DPO (7B)"",""Falcon Instruct (7B)"",""Mixtral-8x7B-Instruct-v0.1"",""gemini-pro"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Qwen 1.5 Chat (7B)"",""chat-bison-32k (PaLM 2 32K)"",""WizardLM v1.2 (13B)"",""chat-bison (PaLM 2)"",""gpt-4-turbo"",""LLaMA-2 Chat (7B)"",""llama-2-70b-chat"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4"",""OpenHermes-2.5-Mistral (7B)"",""Vicuna v1.5 (7B)"",""01-ai Yi Chat (34B)"",""gpt-3.5-turbo"",""Chronos Hermes (13B)""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BLEU score""},""barmode"":""relative""}}","
+ BLEU (BiLingual Evaluation Understudy) measures similarity between n-grams
+ (contiguous sequences of n words) in the generated and reference texts,
+ considering brevity penalties and length normalization.
+ For reference texts we used reference summarizations from the dataset, article title and original article text.
+ Maximum -gram size was set to 3. Unlike BERT score this metric doesn't handle synonyms, semantic nuance and context.
+
+ More about this metric can be read here: [link](https://aclanthology.org/P02-1040.pdf).
+ Higher score indicates better alignment between the generated and reference text. The value is averaged for each model.",",model,BERT_score_precision,BERT_score_recall,BERT_score_F1,BLEU_score,original_text_length_part,sentence_count,length_penalty
+1,Chronos Hermes (13B),0.31285536,0.32630467,0.3150877,0.011542047908319874,0.4742810243835248,3.5818443804034583,14928.0
+18,gpt-3.5-turbo,0.49478123,0.50445867,0.49331823,0.00919205486407126,0.5905700146991734,4.229639819909955,89814.0
+0,01-ai Yi Chat (34B),0.33981326,0.35219854,0.34183535,0.007428840277380581,0.43251538287409536,3.5818443804034583,14928.0
+13,Vicuna v1.5 (7B),0.28434175,0.29119453,0.2839047,0.007105541953090669,0.2781035051738079,3.6173027989821884,16948.0
+7,OpenHermes-2.5-Mistral (7B),0.3621834,0.3685358,0.36003792,0.0068684572027745494,0.312054520357568,3.5818443804034583,14928.0
+19,gpt-4,0.4864653,0.49512562,0.4839312,0.005711113295666468,0.4763731952669352,4.266137566137566,85120.0
+4,Mistral (7B) Instruct v0.2 (Together AI),0.36488953,0.3797993,0.36758336,0.005650224193975447,0.5233998570385472,3.712222222222222,29298.0
+21,llama-2-70b-chat,0.20810011,0.22406381,0.21268094,0.004560500754935232,0.29684572894554634,4.2436893203883495,88008.0
+3,LLaMA-2 Chat (7B),0.32074162,0.33171847,0.32136682,0.004415024709996126,0.4084233313416049,3.5818443804034583,14928.0
+20,gpt-4-turbo,0.42933634,0.4414623,0.4294052,0.0042830628392272,0.5393220459796505,4.266137566137566,85120.0
+15,chat-bison (PaLM 2),0.23123139,0.24001649,0.23214735,0.0037652345768886663,0.2927236655934559,4.281081081081081,83400.0
+14,WizardLM v1.2 (13B),0.3420949,0.34746957,0.33996373,0.00373442128604677,0.28716720161049375,3.5818443804034583,14928.0
+16,chat-bison-32k (PaLM 2 32K),0.23051436,0.23993237,0.2317056,0.003694633514634998,0.2608806894318779,4.281081081081081,83400.0
+8,Qwen 1.5 Chat (7B),0.34898603,0.35945317,0.34867778,0.0033327500620805805,0.29904529709475364,3.5818443804034583,14928.0
+11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122332305,0.12540509,0.12200464,0.003286423403673119,0.13915355617375091,4.244871794871795,87700.0
+17,gemini-pro,0.23109974,0.23956373,0.23199782,0.0032373504004405487,0.295286999418032,4.244871794871795,87700.0
+6,Mixtral-8x7B-Instruct-v0.1,0.19137934,0.2029136,0.19449018,0.0031843990217988536,0.2665288353398184,4.161038961038961,103320.0
+2,Falcon Instruct (7B),0.30270517,0.28607234,0.29104736,0.0030232447024239606,0.0490635544441649,3.5818443804034583,14928.0
+10,Snorkel Mistral PairRM DPO (7B),0.3167385,0.34785262,0.32718164,0.0029236226777824676,3.7740234383755356,3.5818443804034583,14928.0
+22,zephyr-7b-beta,0.085546724,0.08755772,0.085219756,0.0012612839176470308,0.08796697338212889,4.159788702026735,103714.0
+5,Mistral-7B-Instruct-v0.2,0.04389399,0.045185987,0.04378006,0.000566625796313851,0.04250630683894714,4.120342654588421,113258.0
+9,RedPajama-INCITE Chat (7B),0.26832756,0.27305293,0.26768887,0.0,0.0560284823193376,3.5818443804034583,14928.0
+12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0
+","{""x"": ""BLEU_score"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""BLEU_score"": ""BLEU score"", ""model"": ""Model""}, ""title"": ""Summary metrics BLEU score""}"
"Figure({
'data': [{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'chat-bison (PaLM 2)',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
- 'name': 'chat-bison (PaLM 2)',
- 'offsetgroup': 'chat-bison (PaLM 2)',
+ 'name': 'Snorkel Mistral PairRM DPO (7B)',
+ 'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([4.28108108]),
+ 'x': array([3.77402344]),
'xaxis': 'x',
- 'y': array(['chat-bison (PaLM 2)'], dtype=object),
+ 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'gpt-3.5-turbo',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
- 'name': 'chat-bison-32k (PaLM 2 32K)',
- 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'name': 'gpt-3.5-turbo',
+ 'offsetgroup': 'gpt-3.5-turbo',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([4.28108108]),
+ 'x': array([0.59057001]),
'xaxis': 'x',
- 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
+ 'y': array(['gpt-3.5-turbo'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
'legendgroup': 'gpt-4-turbo',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
'name': 'gpt-4-turbo',
@@ -1528,278 +1541,278 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([4.26613757]),
+ 'x': array([0.53932205]),
'xaxis': 'x',
'y': array(['gpt-4-turbo'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'gpt-4',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
- 'name': 'gpt-4',
- 'offsetgroup': 'gpt-4',
+ 'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([4.26613757]),
+ 'x': array([0.52339986]),
'xaxis': 'x',
- 'y': array(['gpt-4'], dtype=object),
+ 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'gemini-pro',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'gpt-4',
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
- 'name': 'gemini-pro',
- 'offsetgroup': 'gemini-pro',
+ 'name': 'gpt-4',
+ 'offsetgroup': 'gpt-4',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([4.24487179]),
+ 'x': array([0.4763732]),
'xaxis': 'x',
- 'y': array(['gemini-pro'], dtype=object),
+ 'y': array(['gpt-4'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'Chronos Hermes (13B)',
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
- 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
- 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'name': 'Chronos Hermes (13B)',
+ 'offsetgroup': 'Chronos Hermes (13B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([4.24487179]),
+ 'x': array([0.47428102]),
'xaxis': 'x',
- 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
+ 'y': array(['Chronos Hermes (13B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'llama-2-70b-chat',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': '01-ai Yi Chat (34B)',
'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
- 'name': 'llama-2-70b-chat',
- 'offsetgroup': 'llama-2-70b-chat',
+ 'name': '01-ai Yi Chat (34B)',
+ 'offsetgroup': '01-ai Yi Chat (34B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([4.24368932]),
+ 'x': array([0.43251538]),
'xaxis': 'x',
- 'y': array(['llama-2-70b-chat'], dtype=object),
+ 'y': array(['01-ai Yi Chat (34B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'gpt-3.5-turbo',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'LLaMA-2 Chat (7B)',
'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
- 'name': 'gpt-3.5-turbo',
- 'offsetgroup': 'gpt-3.5-turbo',
+ 'name': 'LLaMA-2 Chat (7B)',
+ 'offsetgroup': 'LLaMA-2 Chat (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([4.22963982]),
+ 'x': array([0.40842333]),
'xaxis': 'x',
- 'y': array(['gpt-3.5-turbo'], dtype=object),
+ 'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
- 'name': 'Mixtral-8x7B-Instruct-v0.1',
- 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'name': 'OpenHermes-2.5-Mistral (7B)',
+ 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([4.16103896]),
+ 'x': array([0.31205452]),
'xaxis': 'x',
- 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
+ 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'zephyr-7b-beta',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'Qwen 1.5 Chat (7B)',
'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
- 'name': 'zephyr-7b-beta',
- 'offsetgroup': 'zephyr-7b-beta',
+ 'name': 'Qwen 1.5 Chat (7B)',
+ 'offsetgroup': 'Qwen 1.5 Chat (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([4.1597887]),
+ 'x': array([0.2990453]),
'xaxis': 'x',
- 'y': array(['zephyr-7b-beta'], dtype=object),
+ 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'Mistral-7B-Instruct-v0.2',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'llama-2-70b-chat',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
- 'name': 'Mistral-7B-Instruct-v0.2',
- 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
+ 'name': 'llama-2-70b-chat',
+ 'offsetgroup': 'llama-2-70b-chat',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([4.12034265]),
+ 'x': array([0.29684573]),
'xaxis': 'x',
- 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
+ 'y': array(['llama-2-70b-chat'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'gemini-pro',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
- 'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
- 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'name': 'gemini-pro',
+ 'offsetgroup': 'gemini-pro',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([3.71222222]),
+ 'x': array([0.295287]),
'xaxis': 'x',
- 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
+ 'y': array(['gemini-pro'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'Vicuna v1.5 (7B)',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'chat-bison (PaLM 2)',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
- 'name': 'Vicuna v1.5 (7B)',
- 'offsetgroup': 'Vicuna v1.5 (7B)',
+ 'name': 'chat-bison (PaLM 2)',
+ 'offsetgroup': 'chat-bison (PaLM 2)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([3.6173028]),
+ 'x': array([0.29272367]),
'xaxis': 'x',
- 'y': array(['Vicuna v1.5 (7B)'], dtype=object),
+ 'y': array(['chat-bison (PaLM 2)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'Falcon Instruct (7B)',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'WizardLM v1.2 (13B)',
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
- 'name': 'Falcon Instruct (7B)',
- 'offsetgroup': 'Falcon Instruct (7B)',
+ 'name': 'WizardLM v1.2 (13B)',
+ 'offsetgroup': 'WizardLM v1.2 (13B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([3.58184438]),
+ 'x': array([0.2871672]),
'xaxis': 'x',
- 'y': array(['Falcon Instruct (7B)'], dtype=object),
+ 'y': array(['WizardLM v1.2 (13B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'RedPajama-INCITE Chat (7B)',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'Vicuna v1.5 (7B)',
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
- 'name': 'RedPajama-INCITE Chat (7B)',
- 'offsetgroup': 'RedPajama-INCITE Chat (7B)',
+ 'name': 'Vicuna v1.5 (7B)',
+ 'offsetgroup': 'Vicuna v1.5 (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([3.58184438]),
+ 'x': array([0.27810351]),
'xaxis': 'x',
- 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
+ 'y': array(['Vicuna v1.5 (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
- 'name': 'Snorkel Mistral PairRM DPO (7B)',
- 'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([3.58184438]),
+ 'x': array([0.26652884]),
'xaxis': 'x',
- 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
+ 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'WizardLM v1.2 (13B)',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
- 'name': 'WizardLM v1.2 (13B)',
- 'offsetgroup': 'WizardLM v1.2 (13B)',
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([3.58184438]),
+ 'x': array([0.26088069]),
'xaxis': 'x',
- 'y': array(['WizardLM v1.2 (13B)'], dtype=object),
+ 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'Qwen 1.5 Chat (7B)',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
- 'name': 'Qwen 1.5 Chat (7B)',
- 'offsetgroup': 'Qwen 1.5 Chat (7B)',
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([3.58184438]),
+ 'x': array([0.13915356]),
'xaxis': 'x',
- 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
+ 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'zephyr-7b-beta',
'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
- 'name': 'OpenHermes-2.5-Mistral (7B)',
- 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'name': 'zephyr-7b-beta',
+ 'offsetgroup': 'zephyr-7b-beta',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([3.58184438]),
+ 'x': array([0.08796697]),
'xaxis': 'x',
- 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
+ 'y': array(['zephyr-7b-beta'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'LLaMA-2 Chat (7B)',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'RedPajama-INCITE Chat (7B)',
'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
- 'name': 'LLaMA-2 Chat (7B)',
- 'offsetgroup': 'LLaMA-2 Chat (7B)',
+ 'name': 'RedPajama-INCITE Chat (7B)',
+ 'offsetgroup': 'RedPajama-INCITE Chat (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([3.58184438]),
+ 'x': array([0.05602848]),
'xaxis': 'x',
- 'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
+ 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': '01-ai Yi Chat (34B)',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'Falcon Instruct (7B)',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
- 'name': '01-ai Yi Chat (34B)',
- 'offsetgroup': '01-ai Yi Chat (34B)',
+ 'name': 'Falcon Instruct (7B)',
+ 'offsetgroup': 'Falcon Instruct (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([3.58184438]),
+ 'x': array([0.04906355]),
'xaxis': 'x',
- 'y': array(['01-ai Yi Chat (34B)'], dtype=object),
+ 'y': array(['Falcon Instruct (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
- 'legendgroup': 'Chronos Hermes (13B)',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
- 'name': 'Chronos Hermes (13B)',
- 'offsetgroup': 'Chronos Hermes (13B)',
+ 'name': 'Mistral-7B-Instruct-v0.2',
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([3.58184438]),
+ 'x': array([0.04250631]),
'xaxis': 'x',
- 'y': array(['Chronos Hermes (13B)'], dtype=object),
+ 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
+ 'hovertemplate': 'Model=%{y}
original text length part=%{x}',
'legendgroup': 'Upstage SOLAR Instruct v1 (11B)',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
'name': 'Upstage SOLAR Instruct v1 (11B)',
@@ -1808,218 +1821,221 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([3.58184438]),
+ 'x': array([0.00176623]),
'xaxis': 'x',
'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object),
'yaxis': 'y'}],
'layout': {'barmode': 'relative',
'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
'template': '...',
- 'title': {'text': 'Summary metrics sentence count'},
- 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'sentence count'}},
+ 'title': {'text': 'Summary metrics original text length part'},
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'original text length part'}},
'yaxis': {'anchor': 'x',
'categoryarray': [Upstage SOLAR Instruct v1 (11B),
- Chronos Hermes (13B), 01-ai Yi Chat
- (34B), LLaMA-2 Chat (7B),
- OpenHermes-2.5-Mistral (7B), Qwen 1.5
- Chat (7B), WizardLM v1.2 (13B), Snorkel
- Mistral PairRM DPO (7B), RedPajama-
- INCITE Chat (7B), Falcon Instruct (7B),
- Vicuna v1.5 (7B), Mistral (7B) Instruct
- v0.2 (Together AI),
- Mistral-7B-Instruct-v0.2,
- zephyr-7b-beta,
- Mixtral-8x7B-Instruct-v0.1,
- gpt-3.5-turbo, llama-2-70b-chat,
+ Mistral-7B-Instruct-v0.2, Falcon
+ Instruct (7B), RedPajama-INCITE Chat
+ (7B), zephyr-7b-beta,
TinyLlama/TinyLlama-1.1B-Chat-v1.0,
- gemini-pro, gpt-4, gpt-4-turbo, chat-
- bison-32k (PaLM 2 32K), chat-bison (PaLM
- 2)],
+ chat-bison-32k (PaLM 2 32K),
+ Mixtral-8x7B-Instruct-v0.1, Vicuna v1.5
+ (7B), WizardLM v1.2 (13B), chat-bison
+ (PaLM 2), gemini-pro, llama-2-70b-chat,
+ Qwen 1.5 Chat (7B),
+ OpenHermes-2.5-Mistral (7B), LLaMA-2
+ Chat (7B), 01-ai Yi Chat (34B), Chronos
+ Hermes (13B), gpt-4, Mistral (7B)
+ Instruct v0.2 (Together AI),
+ gpt-4-turbo, gpt-3.5-turbo, Snorkel
+ Mistral PairRM DPO (7B)],
'categoryorder': 'array',
'domain': [0.0, 1.0],
'title': {'text': 'Model'}}}
-})",Summary metrics sentence count,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.281081081081081],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.281081081081081],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.266137566137566],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.266137566137566],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.244871794871795],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.244871794871795],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.2436893203883495],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.229639819909955],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.161038961038961],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.159788702026735],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.120342654588421],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.712222222222222],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.6173027989821884],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""sentence count""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Chronos Hermes (13B)"",""01-ai Yi Chat (34B)"",""LLaMA-2 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Qwen 1.5 Chat (7B)"",""WizardLM v1.2 (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""Mixtral-8x7B-Instruct-v0.1"",""gpt-3.5-turbo"",""llama-2-70b-chat"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""gemini-pro"",""gpt-4"",""gpt-4-turbo"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics sentence count""},""barmode"":""relative""}}",Average sentence count of the summary.,",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score
-15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363
-16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325
-20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464
-19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337
-17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664
-11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842
-21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284
-18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592
-6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283
-22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574
-5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363
-4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351
-13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228
-2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395
-9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0
-10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987
-14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015
-8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172
-7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231
-3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306
-0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339
-1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395
-12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0
-","{""x"": ""sentence_count"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""sentence_count"": ""sentence count"", ""model"": ""Model""}, ""title"": ""Summary metrics sentence count""}"
+})",Summary metrics original text length part,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.7740234383755356],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.5905700146991734],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.5393220459796505],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.5233998570385472],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4763731952669352],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4742810243835248],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.43251538287409536],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4084233313416049],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.312054520357568],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.29904529709475364],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.29684572894554634],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.295286999418032],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2927236655934559],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.28716720161049375],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2781035051738079],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2665288353398184],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2608806894318779],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.13915355617375091],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.08796697338212889],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0560284823193376],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0490635544441649],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.04250630683894714],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0017662349842492329],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""original text length part""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""Falcon Instruct (7B)"",""RedPajama-INCITE Chat (7B)"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison-32k (PaLM 2 32K)"",""Mixtral-8x7B-Instruct-v0.1"",""Vicuna v1.5 (7B)"",""WizardLM v1.2 (13B)"",""chat-bison (PaLM 2)"",""gemini-pro"",""llama-2-70b-chat"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""LLaMA-2 Chat (7B)"",""01-ai Yi Chat (34B)"",""Chronos Hermes (13B)"",""gpt-4"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-3.5-turbo"",""Snorkel Mistral PairRM DPO (7B)""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics original text length part""},""barmode"":""relative""}}","How long is the summarization compared to the original text,
+ calculated as: `len(summarized_text) + 1 / len(original_text) + 1`.
+
+ The value is averaged for each model.
+ ",",model,BERT_score_precision,BERT_score_recall,BERT_score_F1,BLEU_score,original_text_length_part,sentence_count,length_penalty
+10,Snorkel Mistral PairRM DPO (7B),0.3167385,0.34785262,0.32718164,0.0029236226777824676,3.7740234383755356,3.5818443804034583,14928.0
+18,gpt-3.5-turbo,0.49478123,0.50445867,0.49331823,0.00919205486407126,0.5905700146991734,4.229639819909955,89814.0
+20,gpt-4-turbo,0.42933634,0.4414623,0.4294052,0.0042830628392272,0.5393220459796505,4.266137566137566,85120.0
+4,Mistral (7B) Instruct v0.2 (Together AI),0.36488953,0.3797993,0.36758336,0.005650224193975447,0.5233998570385472,3.712222222222222,29298.0
+19,gpt-4,0.4864653,0.49512562,0.4839312,0.005711113295666468,0.4763731952669352,4.266137566137566,85120.0
+1,Chronos Hermes (13B),0.31285536,0.32630467,0.3150877,0.011542047908319874,0.4742810243835248,3.5818443804034583,14928.0
+0,01-ai Yi Chat (34B),0.33981326,0.35219854,0.34183535,0.007428840277380581,0.43251538287409536,3.5818443804034583,14928.0
+3,LLaMA-2 Chat (7B),0.32074162,0.33171847,0.32136682,0.004415024709996126,0.4084233313416049,3.5818443804034583,14928.0
+7,OpenHermes-2.5-Mistral (7B),0.3621834,0.3685358,0.36003792,0.0068684572027745494,0.312054520357568,3.5818443804034583,14928.0
+8,Qwen 1.5 Chat (7B),0.34898603,0.35945317,0.34867778,0.0033327500620805805,0.29904529709475364,3.5818443804034583,14928.0
+21,llama-2-70b-chat,0.20810011,0.22406381,0.21268094,0.004560500754935232,0.29684572894554634,4.2436893203883495,88008.0
+17,gemini-pro,0.23109974,0.23956373,0.23199782,0.0032373504004405487,0.295286999418032,4.244871794871795,87700.0
+15,chat-bison (PaLM 2),0.23123139,0.24001649,0.23214735,0.0037652345768886663,0.2927236655934559,4.281081081081081,83400.0
+14,WizardLM v1.2 (13B),0.3420949,0.34746957,0.33996373,0.00373442128604677,0.28716720161049375,3.5818443804034583,14928.0
+13,Vicuna v1.5 (7B),0.28434175,0.29119453,0.2839047,0.007105541953090669,0.2781035051738079,3.6173027989821884,16948.0
+6,Mixtral-8x7B-Instruct-v0.1,0.19137934,0.2029136,0.19449018,0.0031843990217988536,0.2665288353398184,4.161038961038961,103320.0
+16,chat-bison-32k (PaLM 2 32K),0.23051436,0.23993237,0.2317056,0.003694633514634998,0.2608806894318779,4.281081081081081,83400.0
+11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122332305,0.12540509,0.12200464,0.003286423403673119,0.13915355617375091,4.244871794871795,87700.0
+22,zephyr-7b-beta,0.085546724,0.08755772,0.085219756,0.0012612839176470308,0.08796697338212889,4.159788702026735,103714.0
+9,RedPajama-INCITE Chat (7B),0.26832756,0.27305293,0.26768887,0.0,0.0560284823193376,3.5818443804034583,14928.0
+2,Falcon Instruct (7B),0.30270517,0.28607234,0.29104736,0.0030232447024239606,0.0490635544441649,3.5818443804034583,14928.0
+5,Mistral-7B-Instruct-v0.2,0.04389399,0.045185987,0.04378006,0.000566625796313851,0.04250630683894714,4.120342654588421,113258.0
+12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0
+","{""x"": ""original_text_length_part"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""original_text_length_part"": ""original text length part"", ""model"": ""Model""}, ""title"": ""Summary metrics original text length part""}"
"Figure({
'data': [{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
- 'legendgroup': 'Mistral-7B-Instruct-v0.2',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
+ 'legendgroup': 'chat-bison (PaLM 2)',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
- 'name': 'Mistral-7B-Instruct-v0.2',
- 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
+ 'name': 'chat-bison (PaLM 2)',
+ 'offsetgroup': 'chat-bison (PaLM 2)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([113258.]),
+ 'x': array([4.28108108]),
'xaxis': 'x',
- 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
+ 'y': array(['chat-bison (PaLM 2)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
- 'legendgroup': 'zephyr-7b-beta',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
- 'name': 'zephyr-7b-beta',
- 'offsetgroup': 'zephyr-7b-beta',
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([103714.]),
+ 'x': array([4.28108108]),
'xaxis': 'x',
- 'y': array(['zephyr-7b-beta'], dtype=object),
+ 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
- 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
+ 'legendgroup': 'gpt-4-turbo',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
- 'name': 'Mixtral-8x7B-Instruct-v0.1',
- 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'name': 'gpt-4-turbo',
+ 'offsetgroup': 'gpt-4-turbo',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([103320.]),
+ 'x': array([4.26613757]),
'xaxis': 'x',
- 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
+ 'y': array(['gpt-4-turbo'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
- 'legendgroup': 'gpt-3.5-turbo',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
+ 'legendgroup': 'gpt-4',
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
- 'name': 'gpt-3.5-turbo',
- 'offsetgroup': 'gpt-3.5-turbo',
+ 'name': 'gpt-4',
+ 'offsetgroup': 'gpt-4',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([89814.]),
+ 'x': array([4.26613757]),
'xaxis': 'x',
- 'y': array(['gpt-3.5-turbo'], dtype=object),
+ 'y': array(['gpt-4'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
- 'legendgroup': 'llama-2-70b-chat',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
+ 'legendgroup': 'gemini-pro',
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
- 'name': 'llama-2-70b-chat',
- 'offsetgroup': 'llama-2-70b-chat',
+ 'name': 'gemini-pro',
+ 'offsetgroup': 'gemini-pro',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([88008.]),
+ 'x': array([4.24487179]),
'xaxis': 'x',
- 'y': array(['llama-2-70b-chat'], dtype=object),
+ 'y': array(['gemini-pro'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
- 'legendgroup': 'gemini-pro',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
- 'name': 'gemini-pro',
- 'offsetgroup': 'gemini-pro',
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([87700.]),
+ 'x': array([4.24487179]),
'xaxis': 'x',
- 'y': array(['gemini-pro'], dtype=object),
+ 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
- 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
+ 'legendgroup': 'llama-2-70b-chat',
'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
- 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
- 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'name': 'llama-2-70b-chat',
+ 'offsetgroup': 'llama-2-70b-chat',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([87700.]),
+ 'x': array([4.24368932]),
'xaxis': 'x',
- 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
+ 'y': array(['llama-2-70b-chat'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
- 'legendgroup': 'gpt-4-turbo',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
+ 'legendgroup': 'gpt-3.5-turbo',
'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
- 'name': 'gpt-4-turbo',
- 'offsetgroup': 'gpt-4-turbo',
+ 'name': 'gpt-3.5-turbo',
+ 'offsetgroup': 'gpt-3.5-turbo',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([85120.]),
+ 'x': array([4.22963982]),
'xaxis': 'x',
- 'y': array(['gpt-4-turbo'], dtype=object),
+ 'y': array(['gpt-3.5-turbo'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
- 'legendgroup': 'gpt-4',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
- 'name': 'gpt-4',
- 'offsetgroup': 'gpt-4',
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([85120.]),
+ 'x': array([4.16103896]),
'xaxis': 'x',
- 'y': array(['gpt-4'], dtype=object),
+ 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
- 'legendgroup': 'chat-bison (PaLM 2)',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
+ 'legendgroup': 'zephyr-7b-beta',
'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
- 'name': 'chat-bison (PaLM 2)',
- 'offsetgroup': 'chat-bison (PaLM 2)',
+ 'name': 'zephyr-7b-beta',
+ 'offsetgroup': 'zephyr-7b-beta',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([83400.]),
+ 'x': array([4.1597887]),
'xaxis': 'x',
- 'y': array(['chat-bison (PaLM 2)'], dtype=object),
+ 'y': array(['zephyr-7b-beta'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
- 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
- 'name': 'chat-bison-32k (PaLM 2 32K)',
- 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'name': 'Mistral-7B-Instruct-v0.2',
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([83400.]),
+ 'x': array([4.12034265]),
'xaxis': 'x',
- 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
+ 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
@@ -2028,12 +2044,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([29298.]),
+ 'x': array([3.71222222]),
'xaxis': 'x',
'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
'legendgroup': 'Vicuna v1.5 (7B)',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
'name': 'Vicuna v1.5 (7B)',
@@ -2042,12 +2058,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([16948.]),
+ 'x': array([3.6173028]),
'xaxis': 'x',
'y': array(['Vicuna v1.5 (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
'legendgroup': 'Falcon Instruct (7B)',
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
'name': 'Falcon Instruct (7B)',
@@ -2056,12 +2072,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([14928.]),
+ 'x': array([3.58184438]),
'xaxis': 'x',
'y': array(['Falcon Instruct (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
'legendgroup': 'RedPajama-INCITE Chat (7B)',
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
'name': 'RedPajama-INCITE Chat (7B)',
@@ -2070,12 +2086,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([14928.]),
+ 'x': array([3.58184438]),
'xaxis': 'x',
'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
'name': 'Snorkel Mistral PairRM DPO (7B)',
@@ -2084,12 +2100,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([14928.]),
+ 'x': array([3.58184438]),
'xaxis': 'x',
'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
'legendgroup': 'WizardLM v1.2 (13B)',
'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
'name': 'WizardLM v1.2 (13B)',
@@ -2098,12 +2114,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([14928.]),
+ 'x': array([3.58184438]),
'xaxis': 'x',
'y': array(['WizardLM v1.2 (13B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
'legendgroup': 'Qwen 1.5 Chat (7B)',
'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
'name': 'Qwen 1.5 Chat (7B)',
@@ -2112,12 +2128,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([14928.]),
+ 'x': array([3.58184438]),
'xaxis': 'x',
'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
'name': 'OpenHermes-2.5-Mistral (7B)',
@@ -2126,12 +2142,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([14928.]),
+ 'x': array([3.58184438]),
'xaxis': 'x',
'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
'legendgroup': 'LLaMA-2 Chat (7B)',
'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
'name': 'LLaMA-2 Chat (7B)',
@@ -2140,12 +2156,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([14928.]),
+ 'x': array([3.58184438]),
'xaxis': 'x',
'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
'legendgroup': '01-ai Yi Chat (34B)',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
'name': '01-ai Yi Chat (34B)',
@@ -2154,12 +2170,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([14928.]),
+ 'x': array([3.58184438]),
'xaxis': 'x',
'y': array(['01-ai Yi Chat (34B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
'legendgroup': 'Chronos Hermes (13B)',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
'name': 'Chronos Hermes (13B)',
@@ -2168,12 +2184,12 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([14928.]),
+ 'x': array([3.58184438]),
'xaxis': 'x',
'y': array(['Chronos Hermes (13B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'hovertemplate': 'Model=%{y}
sentence count=%{x}',
'legendgroup': 'Upstage SOLAR Instruct v1 (11B)',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
'name': 'Upstage SOLAR Instruct v1 (11B)',
@@ -2182,15 +2198,15 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([14928.]),
+ 'x': array([3.58184438]),
'xaxis': 'x',
'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object),
'yaxis': 'y'}],
'layout': {'barmode': 'relative',
'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
'template': '...',
- 'title': {'text': 'Summary metrics length penalty'},
- 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'length penalty'}},
+ 'title': {'text': 'Summary metrics sentence count'},
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'sentence count'}},
'yaxis': {'anchor': 'x',
'categoryarray': [Upstage SOLAR Instruct v1 (11B),
Chronos Hermes (13B), 01-ai Yi Chat
@@ -2200,256 +2216,256 @@ plot_object,header,plot_json,description,df,arguments
Mistral PairRM DPO (7B), RedPajama-
INCITE Chat (7B), Falcon Instruct (7B),
Vicuna v1.5 (7B), Mistral (7B) Instruct
- v0.2 (Together AI), chat-bison-32k (PaLM
- 2 32K), chat-bison (PaLM 2), gpt-4,
- gpt-4-turbo,
- TinyLlama/TinyLlama-1.1B-Chat-v1.0,
- gemini-pro, llama-2-70b-chat,
- gpt-3.5-turbo,
- Mixtral-8x7B-Instruct-v0.1,
+ v0.2 (Together AI),
+ Mistral-7B-Instruct-v0.2,
zephyr-7b-beta,
- Mistral-7B-Instruct-v0.2],
+ Mixtral-8x7B-Instruct-v0.1,
+ gpt-3.5-turbo, llama-2-70b-chat,
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
+ gemini-pro, gpt-4, gpt-4-turbo, chat-
+ bison-32k (PaLM 2 32K), chat-bison (PaLM
+ 2)],
'categoryorder': 'array',
'domain': [0.0, 1.0],
'title': {'text': 'Model'}}}
-})",Summary metrics length penalty,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[113258.0],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[103714.0],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[103320.0],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[89814.0],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[88008.0],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[87700.0],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[87700.0],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[85120.0],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[85120.0],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[83400.0],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[83400.0],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[29298.0],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[16948.0],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""length penalty""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Chronos Hermes (13B)"",""01-ai Yi Chat (34B)"",""LLaMA-2 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Qwen 1.5 Chat (7B)"",""WizardLM v1.2 (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)"",""gpt-4"",""gpt-4-turbo"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""gemini-pro"",""llama-2-70b-chat"",""gpt-3.5-turbo"",""Mixtral-8x7B-Instruct-v0.1"",""zephyr-7b-beta"",""Mistral-7B-Instruct-v0.2""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics length penalty""},""barmode"":""relative""}}",It is assumed that good quality summary contains between 2 and 5 sentences (inclusive range). The penalty is a difference between summary sentence count and this range. It is summed for each model.,",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score
-5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363
-22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574
-6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283
-18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592
-21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284
-17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664
-11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842
-20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464
-19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337
-15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363
-16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325
-4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351
-13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228
-2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395
-9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0
-10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987
-14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015
-8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172
-7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231
-3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306
-0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339
-1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395
-12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0
-","{""x"": ""length_penalty"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""length_penalty"": ""length penalty"", ""model"": ""Model""}, ""title"": ""Summary metrics length penalty""}"
+})",Summary metrics sentence count,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.281081081081081],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.281081081081081],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.266137566137566],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.266137566137566],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.244871794871795],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.244871794871795],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.2436893203883495],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.229639819909955],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.161038961038961],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.159788702026735],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.120342654588421],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.712222222222222],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.6173027989821884],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""sentence count""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Chronos Hermes (13B)"",""01-ai Yi Chat (34B)"",""LLaMA-2 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Qwen 1.5 Chat (7B)"",""WizardLM v1.2 (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""Mixtral-8x7B-Instruct-v0.1"",""gpt-3.5-turbo"",""llama-2-70b-chat"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""gemini-pro"",""gpt-4"",""gpt-4-turbo"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics sentence count""},""barmode"":""relative""}}",Average sentence count of the summary.,",model,BERT_score_precision,BERT_score_recall,BERT_score_F1,BLEU_score,original_text_length_part,sentence_count,length_penalty
+15,chat-bison (PaLM 2),0.23123139,0.24001649,0.23214735,0.0037652345768886663,0.2927236655934559,4.281081081081081,83400.0
+16,chat-bison-32k (PaLM 2 32K),0.23051436,0.23993237,0.2317056,0.003694633514634998,0.2608806894318779,4.281081081081081,83400.0
+20,gpt-4-turbo,0.42933634,0.4414623,0.4294052,0.0042830628392272,0.5393220459796505,4.266137566137566,85120.0
+19,gpt-4,0.4864653,0.49512562,0.4839312,0.005711113295666468,0.4763731952669352,4.266137566137566,85120.0
+17,gemini-pro,0.23109974,0.23956373,0.23199782,0.0032373504004405487,0.295286999418032,4.244871794871795,87700.0
+11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122332305,0.12540509,0.12200464,0.003286423403673119,0.13915355617375091,4.244871794871795,87700.0
+21,llama-2-70b-chat,0.20810011,0.22406381,0.21268094,0.004560500754935232,0.29684572894554634,4.2436893203883495,88008.0
+18,gpt-3.5-turbo,0.49478123,0.50445867,0.49331823,0.00919205486407126,0.5905700146991734,4.229639819909955,89814.0
+6,Mixtral-8x7B-Instruct-v0.1,0.19137934,0.2029136,0.19449018,0.0031843990217988536,0.2665288353398184,4.161038961038961,103320.0
+22,zephyr-7b-beta,0.085546724,0.08755772,0.085219756,0.0012612839176470308,0.08796697338212889,4.159788702026735,103714.0
+5,Mistral-7B-Instruct-v0.2,0.04389399,0.045185987,0.04378006,0.000566625796313851,0.04250630683894714,4.120342654588421,113258.0
+4,Mistral (7B) Instruct v0.2 (Together AI),0.36488953,0.3797993,0.36758336,0.005650224193975447,0.5233998570385472,3.712222222222222,29298.0
+13,Vicuna v1.5 (7B),0.28434175,0.29119453,0.2839047,0.007105541953090669,0.2781035051738079,3.6173027989821884,16948.0
+2,Falcon Instruct (7B),0.30270517,0.28607234,0.29104736,0.0030232447024239606,0.0490635544441649,3.5818443804034583,14928.0
+9,RedPajama-INCITE Chat (7B),0.26832756,0.27305293,0.26768887,0.0,0.0560284823193376,3.5818443804034583,14928.0
+10,Snorkel Mistral PairRM DPO (7B),0.3167385,0.34785262,0.32718164,0.0029236226777824676,3.7740234383755356,3.5818443804034583,14928.0
+14,WizardLM v1.2 (13B),0.3420949,0.34746957,0.33996373,0.00373442128604677,0.28716720161049375,3.5818443804034583,14928.0
+8,Qwen 1.5 Chat (7B),0.34898603,0.35945317,0.34867778,0.0033327500620805805,0.29904529709475364,3.5818443804034583,14928.0
+7,OpenHermes-2.5-Mistral (7B),0.3621834,0.3685358,0.36003792,0.0068684572027745494,0.312054520357568,3.5818443804034583,14928.0
+3,LLaMA-2 Chat (7B),0.32074162,0.33171847,0.32136682,0.004415024709996126,0.4084233313416049,3.5818443804034583,14928.0
+0,01-ai Yi Chat (34B),0.33981326,0.35219854,0.34183535,0.007428840277380581,0.43251538287409536,3.5818443804034583,14928.0
+1,Chronos Hermes (13B),0.31285536,0.32630467,0.3150877,0.011542047908319874,0.4742810243835248,3.5818443804034583,14928.0
+12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0
+","{""x"": ""sentence_count"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""sentence_count"": ""sentence count"", ""model"": ""Model""}, ""title"": ""Summary metrics sentence count""}"
"Figure({
'data': [{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'Chronos Hermes (13B)',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
- 'name': 'Chronos Hermes (13B)',
- 'offsetgroup': 'Chronos Hermes (13B)',
+ 'name': 'Mistral-7B-Instruct-v0.2',
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.01143901]),
+ 'x': array([113258.]),
'xaxis': 'x',
- 'y': array(['Chronos Hermes (13B)'], dtype=object),
+ 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'gpt-3.5-turbo',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'zephyr-7b-beta',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
- 'name': 'gpt-3.5-turbo',
- 'offsetgroup': 'gpt-3.5-turbo',
+ 'name': 'zephyr-7b-beta',
+ 'offsetgroup': 'zephyr-7b-beta',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00789245]),
+ 'x': array([103714.]),
'xaxis': 'x',
- 'y': array(['gpt-3.5-turbo'], dtype=object),
+ 'y': array(['zephyr-7b-beta'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': '01-ai Yi Chat (34B)',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
- 'name': '01-ai Yi Chat (34B)',
- 'offsetgroup': '01-ai Yi Chat (34B)',
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00731157]),
+ 'x': array([103320.]),
'xaxis': 'x',
- 'y': array(['01-ai Yi Chat (34B)'], dtype=object),
+ 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'Vicuna v1.5 (7B)',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'gpt-3.5-turbo',
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
- 'name': 'Vicuna v1.5 (7B)',
- 'offsetgroup': 'Vicuna v1.5 (7B)',
+ 'name': 'gpt-3.5-turbo',
+ 'offsetgroup': 'gpt-3.5-turbo',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00695233]),
+ 'x': array([89814.]),
'xaxis': 'x',
- 'y': array(['Vicuna v1.5 (7B)'], dtype=object),
+ 'y': array(['gpt-3.5-turbo'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'llama-2-70b-chat',
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
- 'name': 'OpenHermes-2.5-Mistral (7B)',
- 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'name': 'llama-2-70b-chat',
+ 'offsetgroup': 'llama-2-70b-chat',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00656316]),
+ 'x': array([88008.]),
'xaxis': 'x',
- 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
+ 'y': array(['llama-2-70b-chat'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'gemini-pro',
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
- 'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
- 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'name': 'gemini-pro',
+ 'offsetgroup': 'gemini-pro',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00547852]),
+ 'x': array([87700.]),
'xaxis': 'x',
- 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
+ 'y': array(['gemini-pro'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'gpt-4',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
- 'name': 'gpt-4',
- 'offsetgroup': 'gpt-4',
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00470457]),
+ 'x': array([87700.]),
'xaxis': 'x',
- 'y': array(['gpt-4'], dtype=object),
+ 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'LLaMA-2 Chat (7B)',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'gpt-4-turbo',
'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
- 'name': 'LLaMA-2 Chat (7B)',
- 'offsetgroup': 'LLaMA-2 Chat (7B)',
+ 'name': 'gpt-4-turbo',
+ 'offsetgroup': 'gpt-4-turbo',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00425586]),
+ 'x': array([85120.]),
'xaxis': 'x',
- 'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
+ 'y': array(['gpt-4-turbo'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'WizardLM v1.2 (13B)',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'gpt-4',
'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
- 'name': 'WizardLM v1.2 (13B)',
- 'offsetgroup': 'WizardLM v1.2 (13B)',
+ 'name': 'gpt-4',
+ 'offsetgroup': 'gpt-4',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00367138]),
+ 'x': array([85120.]),
'xaxis': 'x',
- 'y': array(['WizardLM v1.2 (13B)'], dtype=object),
+ 'y': array(['gpt-4'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'gpt-4-turbo',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'chat-bison (PaLM 2)',
'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
- 'name': 'gpt-4-turbo',
- 'offsetgroup': 'gpt-4-turbo',
+ 'name': 'chat-bison (PaLM 2)',
+ 'offsetgroup': 'chat-bison (PaLM 2)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00348737]),
+ 'x': array([83400.]),
'xaxis': 'x',
- 'y': array(['gpt-4-turbo'], dtype=object),
+ 'y': array(['chat-bison (PaLM 2)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'chat-bison (PaLM 2)',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
- 'name': 'chat-bison (PaLM 2)',
- 'offsetgroup': 'chat-bison (PaLM 2)',
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00331735]),
+ 'x': array([83400.]),
'xaxis': 'x',
- 'y': array(['chat-bison (PaLM 2)'], dtype=object),
+ 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'llama-2-70b-chat',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
- 'name': 'llama-2-70b-chat',
- 'offsetgroup': 'llama-2-70b-chat',
+ 'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00329426]),
+ 'x': array([29298.]),
'xaxis': 'x',
- 'y': array(['llama-2-70b-chat'], dtype=object),
+ 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'Qwen 1.5 Chat (7B)',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'Vicuna v1.5 (7B)',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
- 'name': 'Qwen 1.5 Chat (7B)',
- 'offsetgroup': 'Qwen 1.5 Chat (7B)',
+ 'name': 'Vicuna v1.5 (7B)',
+ 'offsetgroup': 'Vicuna v1.5 (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00318557]),
+ 'x': array([16948.]),
'xaxis': 'x',
- 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
+ 'y': array(['Vicuna v1.5 (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'Falcon Instruct (7B)',
'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
- 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
- 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'name': 'Falcon Instruct (7B)',
+ 'offsetgroup': 'Falcon Instruct (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00299116]),
+ 'x': array([14928.]),
'xaxis': 'x',
- 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
+ 'y': array(['Falcon Instruct (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'RedPajama-INCITE Chat (7B)',
'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
- 'name': 'chat-bison-32k (PaLM 2 32K)',
- 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'name': 'RedPajama-INCITE Chat (7B)',
+ 'offsetgroup': 'RedPajama-INCITE Chat (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00297091]),
+ 'x': array([14928.]),
'xaxis': 'x',
- 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
+ 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
'name': 'Snorkel Mistral PairRM DPO (7B)',
@@ -2458,96 +2474,96 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.0029079]),
+ 'x': array([14928.]),
'xaxis': 'x',
'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'WizardLM v1.2 (13B)',
'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
- 'name': 'Mixtral-8x7B-Instruct-v0.1',
- 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'name': 'WizardLM v1.2 (13B)',
+ 'offsetgroup': 'WizardLM v1.2 (13B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00268393]),
+ 'x': array([14928.]),
'xaxis': 'x',
- 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
+ 'y': array(['WizardLM v1.2 (13B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'gemini-pro',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'Qwen 1.5 Chat (7B)',
'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
- 'name': 'gemini-pro',
- 'offsetgroup': 'gemini-pro',
+ 'name': 'Qwen 1.5 Chat (7B)',
+ 'offsetgroup': 'Qwen 1.5 Chat (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00254393]),
+ 'x': array([14928.]),
'xaxis': 'x',
- 'y': array(['gemini-pro'], dtype=object),
+ 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'zephyr-7b-beta',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
- 'name': 'zephyr-7b-beta',
- 'offsetgroup': 'zephyr-7b-beta',
+ 'name': 'OpenHermes-2.5-Mistral (7B)',
+ 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00106251]),
+ 'x': array([14928.]),
'xaxis': 'x',
- 'y': array(['zephyr-7b-beta'], dtype=object),
+ 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'Mistral-7B-Instruct-v0.2',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'LLaMA-2 Chat (7B)',
'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
- 'name': 'Mistral-7B-Instruct-v0.2',
- 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
+ 'name': 'LLaMA-2 Chat (7B)',
+ 'offsetgroup': 'LLaMA-2 Chat (7B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00049303]),
+ 'x': array([14928.]),
'xaxis': 'x',
- 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
+ 'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'Falcon Instruct (7B)',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': '01-ai Yi Chat (34B)',
'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
- 'name': 'Falcon Instruct (7B)',
- 'offsetgroup': 'Falcon Instruct (7B)',
+ 'name': '01-ai Yi Chat (34B)',
+ 'offsetgroup': '01-ai Yi Chat (34B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.00021729]),
+ 'x': array([14928.]),
'xaxis': 'x',
- 'y': array(['Falcon Instruct (7B)'], dtype=object),
+ 'y': array(['01-ai Yi Chat (34B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
- 'legendgroup': 'RedPajama-INCITE Chat (7B)',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
+ 'legendgroup': 'Chronos Hermes (13B)',
'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
- 'name': 'RedPajama-INCITE Chat (7B)',
- 'offsetgroup': 'RedPajama-INCITE Chat (7B)',
+ 'name': 'Chronos Hermes (13B)',
+ 'offsetgroup': 'Chronos Hermes (13B)',
'orientation': 'h',
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.]),
+ 'x': array([14928.]),
'xaxis': 'x',
- 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
+ 'y': array(['Chronos Hermes (13B)'], dtype=object),
'yaxis': 'y'},
{'alignmentgroup': 'True',
- 'hovertemplate': 'Model=%{y}
BLEU score=%{x}',
+ 'hovertemplate': 'Model=%{y}
length penalty=%{x}',
'legendgroup': 'Upstage SOLAR Instruct v1 (11B)',
'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
'name': 'Upstage SOLAR Instruct v1 (11B)',
@@ -2556,56 +2572,61 @@ plot_object,header,plot_json,description,df,arguments
'showlegend': True,
'textposition': 'auto',
'type': 'bar',
- 'x': array([0.]),
+ 'x': array([14928.]),
'xaxis': 'x',
'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object),
'yaxis': 'y'}],
'layout': {'barmode': 'relative',
'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0},
'template': '...',
- 'title': {'text': 'Summary metrics BLEU score'},
- 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'BLEU score'}},
+ 'title': {'text': 'Summary metrics length penalty'},
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'length penalty'}},
'yaxis': {'anchor': 'x',
'categoryarray': [Upstage SOLAR Instruct v1 (11B),
- RedPajama-INCITE Chat (7B), Falcon
- Instruct (7B), Mistral-7B-Instruct-v0.2,
- zephyr-7b-beta, gemini-pro,
- Mixtral-8x7B-Instruct-v0.1, Snorkel
- Mistral PairRM DPO (7B), chat-bison-32k
- (PaLM 2 32K),
- TinyLlama/TinyLlama-1.1B-Chat-v1.0, Qwen
- 1.5 Chat (7B), llama-2-70b-chat, chat-
- bison (PaLM 2), gpt-4-turbo, WizardLM
- v1.2 (13B), LLaMA-2 Chat (7B), gpt-4,
- Mistral (7B) Instruct v0.2 (Together
- AI), OpenHermes-2.5-Mistral (7B), Vicuna
- v1.5 (7B), 01-ai Yi Chat (34B),
- gpt-3.5-turbo, Chronos Hermes (13B)],
+ Chronos Hermes (13B), 01-ai Yi Chat
+ (34B), LLaMA-2 Chat (7B),
+ OpenHermes-2.5-Mistral (7B), Qwen 1.5
+ Chat (7B), WizardLM v1.2 (13B), Snorkel
+ Mistral PairRM DPO (7B), RedPajama-
+ INCITE Chat (7B), Falcon Instruct (7B),
+ Vicuna v1.5 (7B), Mistral (7B) Instruct
+ v0.2 (Together AI), chat-bison-32k (PaLM
+ 2 32K), chat-bison (PaLM 2), gpt-4,
+ gpt-4-turbo,
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
+ gemini-pro, llama-2-70b-chat,
+ gpt-3.5-turbo,
+ Mixtral-8x7B-Instruct-v0.1,
+ zephyr-7b-beta,
+ Mistral-7B-Instruct-v0.2],
'categoryorder': 'array',
'domain': [0.0, 1.0],
'title': {'text': 'Model'}}}
-})",Summary metrics BLEU score,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.011439012700594395],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.007892445077902592],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.007311566390840339],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.006952332387656228],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.006563161880264231],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.005478518060743351],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.004704572681138337],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.004255859538193306],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.003671383039102015],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0034873692407505464],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0033173472693443363],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.00329426273003284],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.003185571110431172],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.002991155730532842],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.002970914340485325],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.002907897771152987],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0026839271544750283],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0025439281189154664],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0010625100735849574],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0004930290548816363],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.00021729364201653395],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""BLEU score""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""gemini-pro"",""Mixtral-8x7B-Instruct-v0.1"",""Snorkel Mistral PairRM DPO (7B)"",""chat-bison-32k (PaLM 2 32K)"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Qwen 1.5 Chat (7B)"",""llama-2-70b-chat"",""chat-bison (PaLM 2)"",""gpt-4-turbo"",""WizardLM v1.2 (13B)"",""LLaMA-2 Chat (7B)"",""gpt-4"",""Mistral (7B) Instruct v0.2 (Together AI)"",""OpenHermes-2.5-Mistral (7B)"",""Vicuna v1.5 (7B)"",""01-ai Yi Chat (34B)"",""gpt-3.5-turbo"",""Chronos Hermes (13B)""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BLEU score""},""barmode"":""relative""}}","BLEU (BiLingual Evaluation Understudy) measures similarity between unigrams, bigrams and trigrams in the summarized and original text. Unlike BERT score this metric doesn't handle synonyms. Value is averaged for each model.",",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score
-1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395
-18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592
-0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339
-13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228
-7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231
-4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351
-19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337
-3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306
-14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015
-20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464
-15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363
-21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284
-8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172
-11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842
-16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325
-10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987
-6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283
-17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664
-22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574
-5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363
-2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395
-9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0
-12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0
-","{""x"": ""bleu_score"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""bleu_score"": ""BLEU score"", ""model"": ""Model""}, ""title"": ""Summary metrics BLEU score""}"
+})",Summary metrics length penalty,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[113258.0],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[103714.0],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[103320.0],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[89814.0],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[88008.0],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[87700.0],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[87700.0],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[85120.0],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[85120.0],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[83400.0],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[83400.0],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[29298.0],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[16948.0],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""length penalty""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Chronos Hermes (13B)"",""01-ai Yi Chat (34B)"",""LLaMA-2 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Qwen 1.5 Chat (7B)"",""WizardLM v1.2 (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)"",""gpt-4"",""gpt-4-turbo"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""gemini-pro"",""llama-2-70b-chat"",""gpt-3.5-turbo"",""Mixtral-8x7B-Instruct-v0.1"",""zephyr-7b-beta"",""Mistral-7B-Instruct-v0.2""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics length penalty""},""barmode"":""relative""}}","It is assumed that good quality summary contains between 2 and 5 sentences (inclusive range).
+ The penalty is a difference between summary sentence count and this range.
+
+ It is summed for each model.",",model,BERT_score_precision,BERT_score_recall,BERT_score_F1,BLEU_score,original_text_length_part,sentence_count,length_penalty
+5,Mistral-7B-Instruct-v0.2,0.04389399,0.045185987,0.04378006,0.000566625796313851,0.04250630683894714,4.120342654588421,113258.0
+22,zephyr-7b-beta,0.085546724,0.08755772,0.085219756,0.0012612839176470308,0.08796697338212889,4.159788702026735,103714.0
+6,Mixtral-8x7B-Instruct-v0.1,0.19137934,0.2029136,0.19449018,0.0031843990217988536,0.2665288353398184,4.161038961038961,103320.0
+18,gpt-3.5-turbo,0.49478123,0.50445867,0.49331823,0.00919205486407126,0.5905700146991734,4.229639819909955,89814.0
+21,llama-2-70b-chat,0.20810011,0.22406381,0.21268094,0.004560500754935232,0.29684572894554634,4.2436893203883495,88008.0
+17,gemini-pro,0.23109974,0.23956373,0.23199782,0.0032373504004405487,0.295286999418032,4.244871794871795,87700.0
+11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122332305,0.12540509,0.12200464,0.003286423403673119,0.13915355617375091,4.244871794871795,87700.0
+20,gpt-4-turbo,0.42933634,0.4414623,0.4294052,0.0042830628392272,0.5393220459796505,4.266137566137566,85120.0
+19,gpt-4,0.4864653,0.49512562,0.4839312,0.005711113295666468,0.4763731952669352,4.266137566137566,85120.0
+15,chat-bison (PaLM 2),0.23123139,0.24001649,0.23214735,0.0037652345768886663,0.2927236655934559,4.281081081081081,83400.0
+16,chat-bison-32k (PaLM 2 32K),0.23051436,0.23993237,0.2317056,0.003694633514634998,0.2608806894318779,4.281081081081081,83400.0
+4,Mistral (7B) Instruct v0.2 (Together AI),0.36488953,0.3797993,0.36758336,0.005650224193975447,0.5233998570385472,3.712222222222222,29298.0
+13,Vicuna v1.5 (7B),0.28434175,0.29119453,0.2839047,0.007105541953090669,0.2781035051738079,3.6173027989821884,16948.0
+2,Falcon Instruct (7B),0.30270517,0.28607234,0.29104736,0.0030232447024239606,0.0490635544441649,3.5818443804034583,14928.0
+9,RedPajama-INCITE Chat (7B),0.26832756,0.27305293,0.26768887,0.0,0.0560284823193376,3.5818443804034583,14928.0
+10,Snorkel Mistral PairRM DPO (7B),0.3167385,0.34785262,0.32718164,0.0029236226777824676,3.7740234383755356,3.5818443804034583,14928.0
+14,WizardLM v1.2 (13B),0.3420949,0.34746957,0.33996373,0.00373442128604677,0.28716720161049375,3.5818443804034583,14928.0
+8,Qwen 1.5 Chat (7B),0.34898603,0.35945317,0.34867778,0.0033327500620805805,0.29904529709475364,3.5818443804034583,14928.0
+7,OpenHermes-2.5-Mistral (7B),0.3621834,0.3685358,0.36003792,0.0068684572027745494,0.312054520357568,3.5818443804034583,14928.0
+3,LLaMA-2 Chat (7B),0.32074162,0.33171847,0.32136682,0.004415024709996126,0.4084233313416049,3.5818443804034583,14928.0
+0,01-ai Yi Chat (34B),0.33981326,0.35219854,0.34183535,0.007428840277380581,0.43251538287409536,3.5818443804034583,14928.0
+1,Chronos Hermes (13B),0.31285536,0.32630467,0.3150877,0.011542047908319874,0.4742810243835248,3.5818443804034583,14928.0
+12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0
+","{""x"": ""length_penalty"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""length_penalty"": ""length penalty"", ""model"": ""Model""}, ""title"": ""Summary metrics length penalty""}"