diff --git "a/data/summary_metrics_plots.csv" "b/data/summary_metrics_plots.csv" --- "a/data/summary_metrics_plots.csv" +++ "b/data/summary_metrics_plots.csv" @@ -1,7 +1,7 @@ plot_object,header,plot_json,description,df,arguments "Figure({ 'data': [{'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'gpt-3.5-turbo', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, 'name': 'gpt-3.5-turbo', @@ -10,12 +10,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.4943981], dtype=float32), + 'x': array([0.49478123], dtype=float32), 'xaxis': 'x', 'y': array(['gpt-3.5-turbo'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'gpt-4', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, 'name': 'gpt-4', @@ -24,12 +24,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.48605907], dtype=float32), + 'x': array([0.4864653], dtype=float32), 'xaxis': 'x', 'y': array(['gpt-4'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'gpt-4-turbo', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, 'name': 'gpt-4-turbo', @@ -38,12 +38,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.42728576], dtype=float32), + 'x': array([0.42933634], dtype=float32), 'xaxis': 'x', 'y': array(['gpt-4-turbo'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)', 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}}, 'name': 'Mistral (7B) Instruct v0.2 (Together AI)', @@ -52,12 +52,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.3647361], dtype=float32), + 'x': array([0.36488953], dtype=float32), 'xaxis': 'x', 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'OpenHermes-2.5-Mistral (7B)', 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}}, 'name': 'OpenHermes-2.5-Mistral (7B)', @@ -66,12 +66,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.3618188], dtype=float32), + 'x': array([0.3621834], dtype=float32), 'xaxis': 'x', 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'Qwen 1.5 Chat (7B)', 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}}, 'name': 'Qwen 1.5 Chat (7B)', @@ -80,12 +80,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.34855434], dtype=float32), + 'x': array([0.34898603], dtype=float32), 'xaxis': 'x', 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'WizardLM v1.2 (13B)', 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}}, 'name': 'WizardLM v1.2 (13B)', @@ -94,12 +94,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.34085444], dtype=float32), + 'x': array([0.3420949], dtype=float32), 'xaxis': 'x', 'y': array(['WizardLM v1.2 (13B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': '01-ai Yi Chat (34B)', 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}}, 'name': '01-ai Yi Chat (34B)', @@ -108,12 +108,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.33974892], dtype=float32), + 'x': array([0.33981326], dtype=float32), 'xaxis': 'x', 'y': array(['01-ai Yi Chat (34B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'LLaMA-2 Chat (7B)', 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}}, 'name': 'LLaMA-2 Chat (7B)', @@ -122,12 +122,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.3203912], dtype=float32), + 'x': array([0.32074162], dtype=float32), 'xaxis': 'x', 'y': array(['LLaMA-2 Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)', 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}}, 'name': 'Snorkel Mistral PairRM DPO (7B)', @@ -136,12 +136,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.31672964], dtype=float32), + 'x': array([0.3167385], dtype=float32), 'xaxis': 'x', 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'Chronos Hermes (13B)', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, 'name': 'Chronos Hermes (13B)', @@ -150,12 +150,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.3124825], dtype=float32), + 'x': array([0.31285536], dtype=float32), 'xaxis': 'x', 'y': array(['Chronos Hermes (13B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'Falcon Instruct (7B)', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, 'name': 'Falcon Instruct (7B)', @@ -164,12 +164,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.2895086], dtype=float32), + 'x': array([0.30270517], dtype=float32), 'xaxis': 'x', 'y': array(['Falcon Instruct (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'Vicuna v1.5 (7B)', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, 'name': 'Vicuna v1.5 (7B)', @@ -178,12 +178,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.284109], dtype=float32), + 'x': array([0.28434175], dtype=float32), 'xaxis': 'x', 'y': array(['Vicuna v1.5 (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'RedPajama-INCITE Chat (7B)', 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}}, 'name': 'RedPajama-INCITE Chat (7B)', @@ -192,12 +192,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.261367], dtype=float32), + 'x': array([0.26832756], dtype=float32), 'xaxis': 'x', 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'chat-bison (PaLM 2)', 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}}, 'name': 'chat-bison (PaLM 2)', @@ -206,12 +206,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.23117188], dtype=float32), + 'x': array([0.23123139], dtype=float32), 'xaxis': 'x', 'y': array(['chat-bison (PaLM 2)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'gemini-pro', 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}}, 'name': 'gemini-pro', @@ -220,12 +220,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.23105659], dtype=float32), + 'x': array([0.23109974], dtype=float32), 'xaxis': 'x', 'y': array(['gemini-pro'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'chat-bison-32k (PaLM 2 32K)', 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}}, 'name': 'chat-bison-32k (PaLM 2 32K)', @@ -234,12 +234,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.23046139], dtype=float32), + 'x': array([0.23051436], dtype=float32), 'xaxis': 'x', 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'llama-2-70b-chat', 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}}, 'name': 'llama-2-70b-chat', @@ -248,12 +248,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.20800962], dtype=float32), + 'x': array([0.20810011], dtype=float32), 'xaxis': 'x', 'y': array(['llama-2-70b-chat'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1', 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}}, 'name': 'Mixtral-8x7B-Instruct-v0.1', @@ -262,12 +262,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.19128644], dtype=float32), + 'x': array([0.19137934], dtype=float32), 'xaxis': 'x', 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}}, 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', @@ -276,12 +276,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.12218507], dtype=float32), + 'x': array([0.1223323], dtype=float32), 'xaxis': 'x', 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'zephyr-7b-beta', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, 'name': 'zephyr-7b-beta', @@ -290,12 +290,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.08539014], dtype=float32), + 'x': array([0.08554672], dtype=float32), 'xaxis': 'x', 'y': array(['zephyr-7b-beta'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'Mistral-7B-Instruct-v0.2', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, 'name': 'Mistral-7B-Instruct-v0.2', @@ -304,12 +304,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.0438201], dtype=float32), + 'x': array([0.04389399], dtype=float32), 'xaxis': 'x', 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score P=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score precision=%{x}', 'legendgroup': 'Upstage SOLAR Instruct v1 (11B)', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, 'name': 'Upstage SOLAR Instruct v1 (11B)', @@ -325,8 +325,8 @@ plot_object,header,plot_json,description,df,arguments 'layout': {'barmode': 'relative', 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0}, 'template': '...', - 'title': {'text': 'Summary metrics BERT score P'}, - 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'BERT score P'}}, + 'title': {'text': 'Summary metrics BERT score precision'}, + 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'BERT score precision'}}, 'yaxis': {'anchor': 'x', 'categoryarray': [Upstage SOLAR Instruct v1 (11B), Mistral-7B-Instruct-v0.2, @@ -346,34 +346,34 @@ plot_object,header,plot_json,description,df,arguments 'categoryorder': 'array', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}}} -})",Summary metrics BERT score P,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4943981],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.48605907],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.42728576],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3647361],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3618188],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34855434],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34085444],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.33974892],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3203912],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.31672964],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3124825],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2895086],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.284109],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.261367],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23117188],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23105659],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23046139],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.20800962],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.19128644],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.122185074],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.085390136],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.043820098],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":
[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth""
:0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF55
3B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""
xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""BERT score P""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat"",""chat-bison-32k (PaLM 2 32K)"",""gemini-pro"",""chat-bison (PaLM 2)"",""RedPajama-INCITE Chat (7B)"",""Vicuna v1.5 (7B)"",""Falcon Instruct (7B)"",""Chronos Hermes (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""LLaMA-2 Chat (7B)"",""01-ai Yi Chat (34B)"",""WizardLM v1.2 (13B)"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-4"",""gpt-3.5-turbo""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BERT score P""},""barmode"":""relative""}}",,",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score 
-18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592 -19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337 -20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464 -4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351 -7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231 -8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172 -14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015 -0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339 -3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306 -10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987 -1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395 -2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395 -13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228 -9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0 -15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363 -17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664 -16,chat-bison-32k (PaLM 2 
32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325 -21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284 -6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283 -11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842 -22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574 -5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363 -12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0 -","{""x"": ""bert_score_P"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""bert_score_P"": ""BERT score P"", ""model"": ""Model""}, ""title"": ""Summary metrics BERT score P""}" +})",Summary metrics BERT score precision,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.49478123],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4864653],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.42933634],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.36488953],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3621834],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34898603],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3420949],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.33981326],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.32074162],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3167385],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.31285536],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.30270517],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.28434175],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.26832756],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23123139],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23109974],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23051436],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.20810011],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.19137934],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.122332305],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.085546724],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.04389399],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score precision=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 
(11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},
""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scatterma
pbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""
],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y""
,""domain"":[0.0,1.0],""title"":{""text"":""BERT score precision""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat"",""chat-bison-32k (PaLM 2 32K)"",""gemini-pro"",""chat-bison (PaLM 2)"",""RedPajama-INCITE Chat (7B)"",""Vicuna v1.5 (7B)"",""Falcon Instruct (7B)"",""Chronos Hermes (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""LLaMA-2 Chat (7B)"",""01-ai Yi Chat (34B)"",""WizardLM v1.2 (13B)"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-4"",""gpt-3.5-turbo""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BERT score precision""},""barmode"":""relative""}}",,",model,BERT_score_precision,BERT_score_recall,BERT_score_F1,BLEU_score,original_text_length_part,sentence_count,length_penalty +18,gpt-3.5-turbo,0.49478123,0.50445867,0.49331823,0.00919205486407126,0.5905700146991734,4.229639819909955,89814.0 +19,gpt-4,0.4864653,0.49512562,0.4839312,0.005711113295666468,0.4763731952669352,4.266137566137566,85120.0 +20,gpt-4-turbo,0.42933634,0.4414623,0.4294052,0.0042830628392272,0.5393220459796505,4.266137566137566,85120.0 +4,Mistral (7B) Instruct v0.2 (Together AI),0.36488953,0.3797993,0.36758336,0.005650224193975447,0.5233998570385472,3.712222222222222,29298.0 +7,OpenHermes-2.5-Mistral (7B),0.3621834,0.3685358,0.36003792,0.0068684572027745494,0.312054520357568,3.5818443804034583,14928.0 +8,Qwen 1.5 Chat (7B),0.34898603,0.35945317,0.34867778,0.0033327500620805805,0.29904529709475364,3.5818443804034583,14928.0 +14,WizardLM v1.2 (13B),0.3420949,0.34746957,0.33996373,0.00373442128604677,0.28716720161049375,3.5818443804034583,14928.0 +0,01-ai Yi Chat 
(34B),0.33981326,0.35219854,0.34183535,0.007428840277380581,0.43251538287409536,3.5818443804034583,14928.0 +3,LLaMA-2 Chat (7B),0.32074162,0.33171847,0.32136682,0.004415024709996126,0.4084233313416049,3.5818443804034583,14928.0 +10,Snorkel Mistral PairRM DPO (7B),0.3167385,0.34785262,0.32718164,0.0029236226777824676,3.7740234383755356,3.5818443804034583,14928.0 +1,Chronos Hermes (13B),0.31285536,0.32630467,0.3150877,0.011542047908319874,0.4742810243835248,3.5818443804034583,14928.0 +2,Falcon Instruct (7B),0.30270517,0.28607234,0.29104736,0.0030232447024239606,0.0490635544441649,3.5818443804034583,14928.0 +13,Vicuna v1.5 (7B),0.28434175,0.29119453,0.2839047,0.007105541953090669,0.2781035051738079,3.6173027989821884,16948.0 +9,RedPajama-INCITE Chat (7B),0.26832756,0.27305293,0.26768887,0.0,0.0560284823193376,3.5818443804034583,14928.0 +15,chat-bison (PaLM 2),0.23123139,0.24001649,0.23214735,0.0037652345768886663,0.2927236655934559,4.281081081081081,83400.0 +17,gemini-pro,0.23109974,0.23956373,0.23199782,0.0032373504004405487,0.295286999418032,4.244871794871795,87700.0 +16,chat-bison-32k (PaLM 2 32K),0.23051436,0.23993237,0.2317056,0.003694633514634998,0.2608806894318779,4.281081081081081,83400.0 +21,llama-2-70b-chat,0.20810011,0.22406381,0.21268094,0.004560500754935232,0.29684572894554634,4.2436893203883495,88008.0 +6,Mixtral-8x7B-Instruct-v0.1,0.19137934,0.2029136,0.19449018,0.0031843990217988536,0.2665288353398184,4.161038961038961,103320.0 +11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122332305,0.12540509,0.12200464,0.003286423403673119,0.13915355617375091,4.244871794871795,87700.0 +22,zephyr-7b-beta,0.085546724,0.08755772,0.085219756,0.0012612839176470308,0.08796697338212889,4.159788702026735,103714.0 +5,Mistral-7B-Instruct-v0.2,0.04389399,0.045185987,0.04378006,0.000566625796313851,0.04250630683894714,4.120342654588421,113258.0 +12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0 +","{""x"": ""BERT_score_precision"", 
""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""BERT_score_precision"": ""BERT score precision"", ""model"": ""Model""}, ""title"": ""Summary metrics BERT score precision""}" "Figure({ 'data': [{'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'gpt-3.5-turbo', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, 'name': 'gpt-3.5-turbo', @@ -382,12 +382,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.48408476], dtype=float32), + 'x': array([0.50445867], dtype=float32), 'xaxis': 'x', 'y': array(['gpt-3.5-turbo'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'gpt-4', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, 'name': 'gpt-4', @@ -396,12 +396,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.472583], dtype=float32), + 'x': array([0.49512562], dtype=float32), 'xaxis': 'x', 'y': array(['gpt-4'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'gpt-4-turbo', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, 'name': 'gpt-4-turbo', @@ -410,12 +410,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.4162435], dtype=float32), + 'x': array([0.4414623], dtype=float32), 'xaxis': 'x', 'y': array(['gpt-4-turbo'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)', 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}}, 'name': 'Mistral (7B) Instruct v0.2 (Together AI)', @@ -424,12 +424,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.3664233], dtype=float32), + 'x': array([0.3797993], dtype=float32), 'xaxis': 'x', 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'OpenHermes-2.5-Mistral (7B)', 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}}, 'name': 'OpenHermes-2.5-Mistral (7B)', @@ -438,12 +438,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.35180506], dtype=float32), + 'x': array([0.3685358], dtype=float32), 'xaxis': 'x', 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'Qwen 1.5 Chat (7B)', 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}}, 'name': 'Qwen 1.5 Chat (7B)', @@ -452,12 +452,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.34154576], dtype=float32), + 'x': array([0.35945317], dtype=float32), 'xaxis': 'x', 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': '01-ai Yi Chat (34B)', 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}}, 'name': '01-ai Yi Chat (34B)', @@ -466,12 +466,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.3404481], dtype=float32), + 'x': array([0.35219854], dtype=float32), 'xaxis': 'x', 'y': array(['01-ai Yi Chat (34B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)', 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}}, 'name': 'Snorkel Mistral PairRM DPO (7B)', @@ -480,12 +480,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.33782956], dtype=float32), + 'x': array([0.34785262], dtype=float32), 'xaxis': 'x', 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'WizardLM v1.2 (13B)', 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}}, 'name': 'WizardLM v1.2 (13B)', @@ -494,12 +494,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.32933056], dtype=float32), + 'x': array([0.34746957], dtype=float32), 'xaxis': 'x', 'y': array(['WizardLM v1.2 (13B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'LLaMA-2 Chat (7B)', 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}}, 'name': 'LLaMA-2 Chat (7B)', @@ -508,12 +508,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.3153909], dtype=float32), + 'x': array([0.33171847], dtype=float32), 'xaxis': 'x', 'y': array(['LLaMA-2 Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'Chronos Hermes (13B)', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, 'name': 'Chronos Hermes (13B)', @@ -522,12 +522,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.31071666], dtype=float32), + 'x': array([0.32630467], dtype=float32), 'xaxis': 'x', 'y': array(['Chronos Hermes (13B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'Vicuna v1.5 (7B)', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, 'name': 'Vicuna v1.5 (7B)', @@ -536,12 +536,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.27878883], dtype=float32), + 'x': array([0.29119453], dtype=float32), 'xaxis': 'x', 'y': array(['Vicuna v1.5 (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'Falcon Instruct (7B)', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, 'name': 'Falcon Instruct (7B)', @@ -550,12 +550,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.23968808], dtype=float32), + 'x': array([0.28607234], dtype=float32), 'xaxis': 'x', 'y': array(['Falcon Instruct (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'RedPajama-INCITE Chat (7B)', 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}}, 'name': 'RedPajama-INCITE Chat (7B)', @@ -564,54 +564,54 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.23758642], dtype=float32), + 'x': array([0.27305293], dtype=float32), 'xaxis': 'x', 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', - 'legendgroup': 'gemini-pro', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', + 'legendgroup': 'chat-bison (PaLM 2)', 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}}, - 'name': 'gemini-pro', - 'offsetgroup': 'gemini-pro', + 'name': 'chat-bison (PaLM 2)', + 'offsetgroup': 'chat-bison (PaLM 2)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.23057175], dtype=float32), + 'x': array([0.24001649], dtype=float32), 'xaxis': 'x', - 'y': array(['gemini-pro'], dtype=object), + 'y': array(['chat-bison (PaLM 2)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', - 'legendgroup': 'chat-bison (PaLM 2)', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', + 'legendgroup': 'chat-bison-32k (PaLM 2 32K)', 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}}, - 'name': 'chat-bison (PaLM 2)', - 'offsetgroup': 'chat-bison (PaLM 2)', + 'name': 'chat-bison-32k (PaLM 2 32K)', + 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.23029378], dtype=float32), + 'x': array([0.23993237], dtype=float32), 'xaxis': 'x', - 'y': array(['chat-bison (PaLM 2)'], dtype=object), + 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', - 'legendgroup': 'chat-bison-32k (PaLM 2 32K)', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', + 'legendgroup': 'gemini-pro', 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}}, - 'name': 'chat-bison-32k (PaLM 2 32K)', - 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)', + 'name': 'gemini-pro', + 'offsetgroup': 'gemini-pro', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.22983725], dtype=float32), + 'x': array([0.23956373], dtype=float32), 'xaxis': 'x', - 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object), + 'y': array(['gemini-pro'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'llama-2-70b-chat', 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}}, 'name': 'llama-2-70b-chat', @@ -620,12 +620,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.21472095], dtype=float32), + 'x': array([0.22406381], dtype=float32), 'xaxis': 'x', 'y': array(['llama-2-70b-chat'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1', 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}}, 'name': 'Mixtral-8x7B-Instruct-v0.1', @@ -634,12 +634,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.19555509], dtype=float32), + 'x': array([0.2029136], dtype=float32), 'xaxis': 'x', 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}}, 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', @@ -648,12 +648,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.11885959], dtype=float32), + 'x': array([0.12540509], dtype=float32), 'xaxis': 'x', 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'zephyr-7b-beta', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, 'name': 'zephyr-7b-beta', @@ -662,12 +662,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.08266569], dtype=float32), + 'x': array([0.08755772], dtype=float32), 'xaxis': 'x', 'y': array(['zephyr-7b-beta'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'Mistral-7B-Instruct-v0.2', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, 'name': 'Mistral-7B-Instruct-v0.2', @@ -676,12 +676,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.04256168], dtype=float32), + 'x': array([0.04518599], dtype=float32), 'xaxis': 'x', 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BERT score R=%{x}', + 'hovertemplate': 'Model=%{y}
BERT score recall=%{x}', 'legendgroup': 'Upstage SOLAR Instruct v1 (11B)', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, 'name': 'Upstage SOLAR Instruct v1 (11B)', @@ -697,17 +697,17 @@ plot_object,header,plot_json,description,df,arguments 'layout': {'barmode': 'relative', 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0}, 'template': '...', - 'title': {'text': 'Summary metrics BERT score R'}, - 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'BERT score R'}}, + 'title': {'text': 'Summary metrics BERT score recall'}, + 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'BERT score recall'}}, 'yaxis': {'anchor': 'x', 'categoryarray': [Upstage SOLAR Instruct v1 (11B), Mistral-7B-Instruct-v0.2, zephyr-7b-beta, TinyLlama/TinyLlama-1.1B-Chat-v1.0, Mixtral-8x7B-Instruct-v0.1, - llama-2-70b-chat, chat-bison-32k (PaLM 2 - 32K), chat-bison (PaLM 2), gemini-pro, - RedPajama-INCITE Chat (7B), Falcon + llama-2-70b-chat, gemini-pro, chat- + bison-32k (PaLM 2 32K), chat-bison (PaLM + 2), RedPajama-INCITE Chat (7B), Falcon Instruct (7B), Vicuna v1.5 (7B), Chronos Hermes (13B), LLaMA-2 Chat (7B), WizardLM v1.2 (13B), Snorkel Mistral @@ -719,31 +719,31 @@ plot_object,header,plot_json,description,df,arguments 'categoryorder': 'array', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}}} -})",Summary metrics BERT score R,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.48408476],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.472583],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4162435],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3664233],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.35180506],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34154576],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3404481],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.33782956],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.32933056],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3153909],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.31071666],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.27878883],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23968808],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat 
(7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23758642],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23057175],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23029378],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.22983725],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.21472095],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.19555509],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.11885959],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.08266569],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.042561684],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":
[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth""
:0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF55
3B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""
xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""BERT score R""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)"",""gemini-pro"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Chronos Hermes (13B)"",""LLaMA-2 Chat (7B)"",""WizardLM v1.2 (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""01-ai Yi Chat (34B)"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-4"",""gpt-3.5-turbo""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BERT score R""},""barmode"":""relative""}}",,",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score 
-18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592 -19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337 -20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464 -4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351 -7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231 -8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172 -0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339 -10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987 -14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015 -3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306 -1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395 -13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228 -2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395 -9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0 -17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664 -15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363 -16,chat-bison-32k (PaLM 2 
32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325 -21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284 -6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283 -11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842 -22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574 -5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363 -12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0 -","{""x"": ""bert_score_R"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""bert_score_R"": ""BERT score R"", ""model"": ""Model""}, ""title"": ""Summary metrics BERT score R""}" +})",Summary metrics BERT score recall,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.50445867],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.49512562],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4414623],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3797993],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3685358],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.35945317],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.35219854],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34785262],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34746957],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.33171847],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.32630467],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.29119453],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.28607234],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.27305293],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.24001649],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23993237],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23956373],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.22406381],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2029136],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.12540509],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.08755772],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.045185987],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score recall=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 
(11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},
""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scatterma
pbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""
],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y""
,""domain"":[0.0,1.0],""title"":{""text"":""BERT score recall""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat"",""gemini-pro"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Chronos Hermes (13B)"",""LLaMA-2 Chat (7B)"",""WizardLM v1.2 (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""01-ai Yi Chat (34B)"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-4"",""gpt-3.5-turbo""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BERT score recall""},""barmode"":""relative""}}",,",model,BERT_score_precision,BERT_score_recall,BERT_score_F1,BLEU_score,original_text_length_part,sentence_count,length_penalty +18,gpt-3.5-turbo,0.49478123,0.50445867,0.49331823,0.00919205486407126,0.5905700146991734,4.229639819909955,89814.0 +19,gpt-4,0.4864653,0.49512562,0.4839312,0.005711113295666468,0.4763731952669352,4.266137566137566,85120.0 +20,gpt-4-turbo,0.42933634,0.4414623,0.4294052,0.0042830628392272,0.5393220459796505,4.266137566137566,85120.0 +4,Mistral (7B) Instruct v0.2 (Together AI),0.36488953,0.3797993,0.36758336,0.005650224193975447,0.5233998570385472,3.712222222222222,29298.0 +7,OpenHermes-2.5-Mistral (7B),0.3621834,0.3685358,0.36003792,0.0068684572027745494,0.312054520357568,3.5818443804034583,14928.0 +8,Qwen 1.5 Chat (7B),0.34898603,0.35945317,0.34867778,0.0033327500620805805,0.29904529709475364,3.5818443804034583,14928.0 +0,01-ai Yi Chat (34B),0.33981326,0.35219854,0.34183535,0.007428840277380581,0.43251538287409536,3.5818443804034583,14928.0 +10,Snorkel Mistral PairRM DPO 
(7B),0.3167385,0.34785262,0.32718164,0.0029236226777824676,3.7740234383755356,3.5818443804034583,14928.0 +14,WizardLM v1.2 (13B),0.3420949,0.34746957,0.33996373,0.00373442128604677,0.28716720161049375,3.5818443804034583,14928.0 +3,LLaMA-2 Chat (7B),0.32074162,0.33171847,0.32136682,0.004415024709996126,0.4084233313416049,3.5818443804034583,14928.0 +1,Chronos Hermes (13B),0.31285536,0.32630467,0.3150877,0.011542047908319874,0.4742810243835248,3.5818443804034583,14928.0 +13,Vicuna v1.5 (7B),0.28434175,0.29119453,0.2839047,0.007105541953090669,0.2781035051738079,3.6173027989821884,16948.0 +2,Falcon Instruct (7B),0.30270517,0.28607234,0.29104736,0.0030232447024239606,0.0490635544441649,3.5818443804034583,14928.0 +9,RedPajama-INCITE Chat (7B),0.26832756,0.27305293,0.26768887,0.0,0.0560284823193376,3.5818443804034583,14928.0 +15,chat-bison (PaLM 2),0.23123139,0.24001649,0.23214735,0.0037652345768886663,0.2927236655934559,4.281081081081081,83400.0 +16,chat-bison-32k (PaLM 2 32K),0.23051436,0.23993237,0.2317056,0.003694633514634998,0.2608806894318779,4.281081081081081,83400.0 +17,gemini-pro,0.23109974,0.23956373,0.23199782,0.0032373504004405487,0.295286999418032,4.244871794871795,87700.0 +21,llama-2-70b-chat,0.20810011,0.22406381,0.21268094,0.004560500754935232,0.29684572894554634,4.2436893203883495,88008.0 +6,Mixtral-8x7B-Instruct-v0.1,0.19137934,0.2029136,0.19449018,0.0031843990217988536,0.2665288353398184,4.161038961038961,103320.0 +11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122332305,0.12540509,0.12200464,0.003286423403673119,0.13915355617375091,4.244871794871795,87700.0 +22,zephyr-7b-beta,0.085546724,0.08755772,0.085219756,0.0012612839176470308,0.08796697338212889,4.159788702026735,103714.0 +5,Mistral-7B-Instruct-v0.2,0.04389399,0.045185987,0.04378006,0.000566625796313851,0.04250630683894714,4.120342654588421,113258.0 +12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0 +","{""x"": ""BERT_score_recall"", ""y"": ""model"", 
""color"": ""model"", ""orientation"": ""h"", ""labels"": {""BERT_score_recall"": ""BERT score recall"", ""model"": ""Model""}, ""title"": ""Summary metrics BERT score recall""}" "Figure({ 'data': [{'alignmentgroup': 'True', 'hovertemplate': 'Model=%{y}
BERT score F1=%{x}', @@ -755,7 +755,7 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.4888874], dtype=float32), + 'x': array([0.49331823], dtype=float32), 'xaxis': 'x', 'y': array(['gpt-3.5-turbo'], dtype=object), 'yaxis': 'y'}, @@ -769,7 +769,7 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.47901583], dtype=float32), + 'x': array([0.4839312], dtype=float32), 'xaxis': 'x', 'y': array(['gpt-4'], dtype=object), 'yaxis': 'y'}, @@ -783,7 +783,7 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.42098433], dtype=float32), + 'x': array([0.4294052], dtype=float32), 'xaxis': 'x', 'y': array(['gpt-4-turbo'], dtype=object), 'yaxis': 'y'}, @@ -797,7 +797,7 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.36540908], dtype=float32), + 'x': array([0.36758336], dtype=float32), 'xaxis': 'x', 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object), 'yaxis': 'y'}, @@ -811,7 +811,7 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.3565194], dtype=float32), + 'x': array([0.36003792], dtype=float32), 'xaxis': 'x', 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object), 'yaxis': 'y'}, @@ -825,7 +825,7 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.344803], dtype=float32), + 'x': array([0.34867778], dtype=float32), 'xaxis': 'x', 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object), 'yaxis': 'y'}, @@ -839,7 +839,7 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.3399749], dtype=float32), + 'x': 
array([0.34183535], dtype=float32), 'xaxis': 'x', 'y': array(['01-ai Yi Chat (34B)'], dtype=object), 'yaxis': 'y'}, @@ -853,7 +853,7 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.33466902], dtype=float32), + 'x': array([0.33996373], dtype=float32), 'xaxis': 'x', 'y': array(['WizardLM v1.2 (13B)'], dtype=object), 'yaxis': 'y'}, @@ -867,7 +867,7 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.3265383], dtype=float32), + 'x': array([0.32718164], dtype=float32), 'xaxis': 'x', 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object), 'yaxis': 'y'}, @@ -881,7 +881,7 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.31770444], dtype=float32), + 'x': array([0.32136682], dtype=float32), 'xaxis': 'x', 'y': array(['LLaMA-2 Chat (7B)'], dtype=object), 'yaxis': 'y'}, @@ -895,37 +895,37 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.311415], dtype=float32), + 'x': array([0.3150877], dtype=float32), 'xaxis': 'x', 'y': array(['Chronos Hermes (13B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', 'hovertemplate': 'Model=%{y}
BERT score F1=%{x}', - 'legendgroup': 'Vicuna v1.5 (7B)', + 'legendgroup': 'Falcon Instruct (7B)', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, - 'name': 'Vicuna v1.5 (7B)', - 'offsetgroup': 'Vicuna v1.5 (7B)', + 'name': 'Falcon Instruct (7B)', + 'offsetgroup': 'Falcon Instruct (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.28129113], dtype=float32), + 'x': array([0.29104736], dtype=float32), 'xaxis': 'x', - 'y': array(['Vicuna v1.5 (7B)'], dtype=object), + 'y': array(['Falcon Instruct (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', 'hovertemplate': 'Model=%{y}
BERT score F1=%{x}', - 'legendgroup': 'Falcon Instruct (7B)', + 'legendgroup': 'Vicuna v1.5 (7B)', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, - 'name': 'Falcon Instruct (7B)', - 'offsetgroup': 'Falcon Instruct (7B)', + 'name': 'Vicuna v1.5 (7B)', + 'offsetgroup': 'Vicuna v1.5 (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.2615204], dtype=float32), + 'x': array([0.2839047], dtype=float32), 'xaxis': 'x', - 'y': array(['Falcon Instruct (7B)'], dtype=object), + 'y': array(['Vicuna v1.5 (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', 'hovertemplate': 'Model=%{y}
BERT score F1=%{x}', @@ -937,37 +937,37 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.2487217], dtype=float32), + 'x': array([0.26768887], dtype=float32), 'xaxis': 'x', 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', 'hovertemplate': 'Model=%{y}
BERT score F1=%{x}', - 'legendgroup': 'gemini-pro', + 'legendgroup': 'chat-bison (PaLM 2)', 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}}, - 'name': 'gemini-pro', - 'offsetgroup': 'gemini-pro', + 'name': 'chat-bison (PaLM 2)', + 'offsetgroup': 'chat-bison (PaLM 2)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.23072062], dtype=float32), + 'x': array([0.23214735], dtype=float32), 'xaxis': 'x', - 'y': array(['gemini-pro'], dtype=object), + 'y': array(['chat-bison (PaLM 2)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', 'hovertemplate': 'Model=%{y}
BERT score F1=%{x}', - 'legendgroup': 'chat-bison (PaLM 2)', + 'legendgroup': 'gemini-pro', 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}}, - 'name': 'chat-bison (PaLM 2)', - 'offsetgroup': 'chat-bison (PaLM 2)', + 'name': 'gemini-pro', + 'offsetgroup': 'gemini-pro', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.23060663], dtype=float32), + 'x': array([0.23199782], dtype=float32), 'xaxis': 'x', - 'y': array(['chat-bison (PaLM 2)'], dtype=object), + 'y': array(['gemini-pro'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', 'hovertemplate': 'Model=%{y}
BERT score F1=%{x}', @@ -979,7 +979,7 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.23002876], dtype=float32), + 'x': array([0.2317056], dtype=float32), 'xaxis': 'x', 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object), 'yaxis': 'y'}, @@ -993,7 +993,7 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.21117964], dtype=float32), + 'x': array([0.21268094], dtype=float32), 'xaxis': 'x', 'y': array(['llama-2-70b-chat'], dtype=object), 'yaxis': 'y'}, @@ -1007,7 +1007,7 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.19330867], dtype=float32), + 'x': array([0.19449018], dtype=float32), 'xaxis': 'x', 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object), 'yaxis': 'y'}, @@ -1021,7 +1021,7 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.12042627], dtype=float32), + 'x': array([0.12200464], dtype=float32), 'xaxis': 'x', 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object), 'yaxis': 'y'}, @@ -1035,7 +1035,7 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.08394519], dtype=float32), + 'x': array([0.08521976], dtype=float32), 'xaxis': 'x', 'y': array(['zephyr-7b-beta'], dtype=object), 'yaxis': 'y'}, @@ -1049,7 +1049,7 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.04313921], dtype=float32), + 'x': array([0.04378006], dtype=float32), 'xaxis': 'x', 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object), 'yaxis': 'y'}, @@ -1079,9 +1079,9 @@ plot_object,header,plot_json,description,df,arguments TinyLlama/TinyLlama-1.1B-Chat-v1.0, Mixtral-8x7B-Instruct-v0.1, 
llama-2-70b-chat, chat-bison-32k (PaLM 2 - 32K), chat-bison (PaLM 2), gemini-pro, - RedPajama-INCITE Chat (7B), Falcon - Instruct (7B), Vicuna v1.5 (7B), Chronos + 32K), gemini-pro, chat-bison (PaLM 2), + RedPajama-INCITE Chat (7B), Vicuna v1.5 + (7B), Falcon Instruct (7B), Chronos Hermes (13B), LLaMA-2 Chat (7B), Snorkel Mistral PairRM DPO (7B), WizardLM v1.2 (13B), 01-ai Yi Chat (34B), Qwen 1.5 @@ -1091,48 +1091,54 @@ plot_object,header,plot_json,description,df,arguments 'categoryorder': 'array', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}}} -})",Summary metrics BERT score F1,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4888874],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.47901583],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.42098433],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.36540908],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3565194],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.344803],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3399749],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.33466902],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3265383],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.31770444],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.311415],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.28129113],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2615204],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2487217],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23072062],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23060663],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23002876],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.21117964],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.19330867],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.12042627],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.08394519],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.04313921],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale""
:[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"
":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF5
53B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{"
"xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""BERT score F1""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)"",""gemini-pro"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Chronos Hermes (13B)"",""LLaMA-2 Chat (7B)"",""Snorkel Mistral PairRM DPO (7B)"",""WizardLM v1.2 (13B)"",""01-ai Yi Chat (34B)"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-4"",""gpt-3.5-turbo""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BERT score F1""},""barmode"":""relative""}}",How similar are the BERT model embeddings of the summary to the BERT model embeddings of the original text. 
Value is averaged for each model.,",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score -18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592 -19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337 -20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464 -4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351 -7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231 -8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172 -0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339 -14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015 -10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987 -3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306 -1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395 -13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228 -2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395 -9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0 -17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664 -15,chat-bison (PaLM 
2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363 -16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325 -21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284 -6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283 -11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842 -22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574 -5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363 -12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0 -","{""x"": ""bert_score_F1"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""bert_score_F1"": ""BERT score F1"", ""model"": ""Model""}, ""title"": ""Summary metrics BERT score F1""}" +})",Summary metrics BERT score F1,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.49331823],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4839312],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4294052],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.36758336],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.36003792],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34867778],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34183535],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.33996373],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.32718164],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.32136682],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3150877],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.29104736],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2839047],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat 
(7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.26768887],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23214735],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23199782],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2317056],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.21268094],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.19449018],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.12200464],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.085219756],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score 
F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.04378006],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBERT score F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale""
:[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"
":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF5
53B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{"
"xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""BERT score F1""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat"",""chat-bison-32k (PaLM 2 32K)"",""gemini-pro"",""chat-bison (PaLM 2)"",""RedPajama-INCITE Chat (7B)"",""Vicuna v1.5 (7B)"",""Falcon Instruct (7B)"",""Chronos Hermes (13B)"",""LLaMA-2 Chat (7B)"",""Snorkel Mistral PairRM DPO (7B)"",""WizardLM v1.2 (13B)"",""01-ai Yi Chat (34B)"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-4"",""gpt-3.5-turbo""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BERT score F1""},""barmode"":""relative""}}"," + BERT score uses contextual embeddings from pre-trained BERT model to compare summarized text to reference texts.
+ For reference texts we used reference summarizations from the dataset, article title and original article text.
+ BERT score measures the similarity at both the token and sentence levels, capturing semantic nuances and contextual relevance. + + More about this metric can be read here: [link](https://arxiv.org/pdf/1904.09675.pdf).
+ Higher score indicates better alignment between the generated and reference text. The value is averaged for each model.",",model,BERT_score_precision,BERT_score_recall,BERT_score_F1,BLEU_score,original_text_length_part,sentence_count,length_penalty +18,gpt-3.5-turbo,0.49478123,0.50445867,0.49331823,0.00919205486407126,0.5905700146991734,4.229639819909955,89814.0 +19,gpt-4,0.4864653,0.49512562,0.4839312,0.005711113295666468,0.4763731952669352,4.266137566137566,85120.0 +20,gpt-4-turbo,0.42933634,0.4414623,0.4294052,0.0042830628392272,0.5393220459796505,4.266137566137566,85120.0 +4,Mistral (7B) Instruct v0.2 (Together AI),0.36488953,0.3797993,0.36758336,0.005650224193975447,0.5233998570385472,3.712222222222222,29298.0 +7,OpenHermes-2.5-Mistral (7B),0.3621834,0.3685358,0.36003792,0.0068684572027745494,0.312054520357568,3.5818443804034583,14928.0 +8,Qwen 1.5 Chat (7B),0.34898603,0.35945317,0.34867778,0.0033327500620805805,0.29904529709475364,3.5818443804034583,14928.0 +0,01-ai Yi Chat (34B),0.33981326,0.35219854,0.34183535,0.007428840277380581,0.43251538287409536,3.5818443804034583,14928.0 +14,WizardLM v1.2 (13B),0.3420949,0.34746957,0.33996373,0.00373442128604677,0.28716720161049375,3.5818443804034583,14928.0 +10,Snorkel Mistral PairRM DPO (7B),0.3167385,0.34785262,0.32718164,0.0029236226777824676,3.7740234383755356,3.5818443804034583,14928.0 +3,LLaMA-2 Chat (7B),0.32074162,0.33171847,0.32136682,0.004415024709996126,0.4084233313416049,3.5818443804034583,14928.0 +1,Chronos Hermes (13B),0.31285536,0.32630467,0.3150877,0.011542047908319874,0.4742810243835248,3.5818443804034583,14928.0 +2,Falcon Instruct (7B),0.30270517,0.28607234,0.29104736,0.0030232447024239606,0.0490635544441649,3.5818443804034583,14928.0 +13,Vicuna v1.5 (7B),0.28434175,0.29119453,0.2839047,0.007105541953090669,0.2781035051738079,3.6173027989821884,16948.0 +9,RedPajama-INCITE Chat (7B),0.26832756,0.27305293,0.26768887,0.0,0.0560284823193376,3.5818443804034583,14928.0 +15,chat-bison (PaLM 
2),0.23123139,0.24001649,0.23214735,0.0037652345768886663,0.2927236655934559,4.281081081081081,83400.0 +17,gemini-pro,0.23109974,0.23956373,0.23199782,0.0032373504004405487,0.295286999418032,4.244871794871795,87700.0 +16,chat-bison-32k (PaLM 2 32K),0.23051436,0.23993237,0.2317056,0.003694633514634998,0.2608806894318779,4.281081081081081,83400.0 +21,llama-2-70b-chat,0.20810011,0.22406381,0.21268094,0.004560500754935232,0.29684572894554634,4.2436893203883495,88008.0 +6,Mixtral-8x7B-Instruct-v0.1,0.19137934,0.2029136,0.19449018,0.0031843990217988536,0.2665288353398184,4.161038961038961,103320.0 +11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122332305,0.12540509,0.12200464,0.003286423403673119,0.13915355617375091,4.244871794871795,87700.0 +22,zephyr-7b-beta,0.085546724,0.08755772,0.085219756,0.0012612839176470308,0.08796697338212889,4.159788702026735,103714.0 +5,Mistral-7B-Instruct-v0.2,0.04389399,0.045185987,0.04378006,0.000566625796313851,0.04250630683894714,4.120342654588421,113258.0 +12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0 +","{""x"": ""BERT_score_F1"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""BERT_score_F1"": ""BERT score F1"", ""model"": ""Model""}, ""title"": ""Summary metrics BERT score F1""}" "Figure({ 'data': [{'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'Chronos Hermes (13B)', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, - 'name': 'Snorkel Mistral PairRM DPO (7B)', - 'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)', + 'name': 'Chronos Hermes (13B)', + 'offsetgroup': 'Chronos Hermes (13B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([3.77402344]), + 'x': array([0.01154205]), 'xaxis': 'x', - 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object), + 'y': array(['Chronos Hermes (13B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', 'legendgroup': 'gpt-3.5-turbo', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, 'name': 'gpt-3.5-turbo', @@ -1141,292 +1147,292 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.59057001]), + 'x': array([0.00919205]), 'xaxis': 'x', 'y': array(['gpt-3.5-turbo'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'gpt-4-turbo', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': '01-ai Yi Chat (34B)', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, - 'name': 'gpt-4-turbo', - 'offsetgroup': 'gpt-4-turbo', + 'name': '01-ai Yi Chat (34B)', + 'offsetgroup': '01-ai Yi Chat (34B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.53932205]), + 'x': array([0.00742884]), 'xaxis': 'x', - 'y': array(['gpt-4-turbo'], dtype=object), + 'y': array(['01-ai Yi Chat (34B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'Vicuna v1.5 (7B)', 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}}, - 'name': 'Mistral (7B) Instruct v0.2 (Together AI)', - 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)', + 'name': 'Vicuna v1.5 (7B)', + 'offsetgroup': 'Vicuna v1.5 (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.52339986]), + 'x': array([0.00710554]), 'xaxis': 'x', - 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object), + 'y': array(['Vicuna v1.5 (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'gpt-4', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'OpenHermes-2.5-Mistral (7B)', 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}}, - 'name': 'gpt-4', - 'offsetgroup': 'gpt-4', + 'name': 'OpenHermes-2.5-Mistral (7B)', + 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.4763732]), + 'x': array([0.00686846]), 'xaxis': 'x', - 'y': array(['gpt-4'], dtype=object), + 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'Chronos Hermes (13B)', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'gpt-4', 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}}, - 'name': 'Chronos Hermes (13B)', - 'offsetgroup': 'Chronos Hermes (13B)', + 'name': 'gpt-4', + 'offsetgroup': 'gpt-4', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.47428102]), + 'x': array([0.00571111]), 'xaxis': 'x', - 'y': array(['Chronos Hermes (13B)'], dtype=object), + 'y': array(['gpt-4'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': '01-ai Yi Chat (34B)', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)', 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}}, - 'name': '01-ai Yi Chat (34B)', - 'offsetgroup': '01-ai Yi Chat (34B)', + 'name': 'Mistral (7B) Instruct v0.2 (Together AI)', + 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.43251538]), + 'x': array([0.00565022]), 'xaxis': 'x', - 'y': array(['01-ai Yi Chat (34B)'], dtype=object), + 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'LLaMA-2 Chat (7B)', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'llama-2-70b-chat', 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}}, - 'name': 'LLaMA-2 Chat (7B)', - 'offsetgroup': 'LLaMA-2 Chat (7B)', + 'name': 'llama-2-70b-chat', + 'offsetgroup': 'llama-2-70b-chat', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.40842333]), + 'x': array([0.0045605]), 'xaxis': 'x', - 'y': array(['LLaMA-2 Chat (7B)'], dtype=object), + 'y': array(['llama-2-70b-chat'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'OpenHermes-2.5-Mistral (7B)', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'LLaMA-2 Chat (7B)', 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}}, - 'name': 'OpenHermes-2.5-Mistral (7B)', - 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)', + 'name': 'LLaMA-2 Chat (7B)', + 'offsetgroup': 'LLaMA-2 Chat (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.31205452]), + 'x': array([0.00441502]), 'xaxis': 'x', - 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object), + 'y': array(['LLaMA-2 Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'Qwen 1.5 Chat (7B)', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'gpt-4-turbo', 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}}, - 'name': 'Qwen 1.5 Chat (7B)', - 'offsetgroup': 'Qwen 1.5 Chat (7B)', + 'name': 'gpt-4-turbo', + 'offsetgroup': 'gpt-4-turbo', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.2990453]), + 'x': array([0.00428306]), 'xaxis': 'x', - 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object), + 'y': array(['gpt-4-turbo'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'llama-2-70b-chat', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'chat-bison (PaLM 2)', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, - 'name': 'llama-2-70b-chat', - 'offsetgroup': 'llama-2-70b-chat', + 'name': 'chat-bison (PaLM 2)', + 'offsetgroup': 'chat-bison (PaLM 2)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.29684573]), + 'x': array([0.00376523]), 'xaxis': 'x', - 'y': array(['llama-2-70b-chat'], dtype=object), + 'y': array(['chat-bison (PaLM 2)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'gemini-pro', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'WizardLM v1.2 (13B)', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, - 'name': 'gemini-pro', - 'offsetgroup': 'gemini-pro', + 'name': 'WizardLM v1.2 (13B)', + 'offsetgroup': 'WizardLM v1.2 (13B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.295287]), + 'x': array([0.00373442]), 'xaxis': 'x', - 'y': array(['gemini-pro'], dtype=object), + 'y': array(['WizardLM v1.2 (13B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'chat-bison (PaLM 2)', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'chat-bison-32k (PaLM 2 32K)', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, - 'name': 'chat-bison (PaLM 2)', - 'offsetgroup': 'chat-bison (PaLM 2)', + 'name': 'chat-bison-32k (PaLM 2 32K)', + 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.29272367]), + 'x': array([0.00369463]), 'xaxis': 'x', - 'y': array(['chat-bison (PaLM 2)'], dtype=object), + 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'WizardLM v1.2 (13B)', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'Qwen 1.5 Chat (7B)', 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}}, - 'name': 'WizardLM v1.2 (13B)', - 'offsetgroup': 'WizardLM v1.2 (13B)', + 'name': 'Qwen 1.5 Chat (7B)', + 'offsetgroup': 'Qwen 1.5 Chat (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.2871672]), + 'x': array([0.00333275]), 'xaxis': 'x', - 'y': array(['WizardLM v1.2 (13B)'], dtype=object), + 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'Vicuna v1.5 (7B)', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}}, - 'name': 'Vicuna v1.5 (7B)', - 'offsetgroup': 'Vicuna v1.5 (7B)', + 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', + 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.27810351]), + 'x': array([0.00328642]), 'xaxis': 'x', - 'y': array(['Vicuna v1.5 (7B)'], dtype=object), + 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'gemini-pro', 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}}, - 'name': 'Mixtral-8x7B-Instruct-v0.1', - 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1', + 'name': 'gemini-pro', + 'offsetgroup': 'gemini-pro', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.26652884]), + 'x': array([0.00323735]), 'xaxis': 'x', - 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object), + 'y': array(['gemini-pro'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'chat-bison-32k (PaLM 2 32K)', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1', 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}}, - 'name': 'chat-bison-32k (PaLM 2 32K)', - 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)', + 'name': 'Mixtral-8x7B-Instruct-v0.1', + 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.26088069]), + 'x': array([0.0031844]), 'xaxis': 'x', - 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object), + 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'Falcon Instruct (7B)', 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}}, - 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', - 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', + 'name': 'Falcon Instruct (7B)', + 'offsetgroup': 'Falcon Instruct (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.13915356]), + 'x': array([0.00302324]), 'xaxis': 'x', - 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object), + 'y': array(['Falcon Instruct (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'zephyr-7b-beta', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)', 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}}, - 'name': 'zephyr-7b-beta', - 'offsetgroup': 'zephyr-7b-beta', + 'name': 'Snorkel Mistral PairRM DPO (7B)', + 'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.08796697]), + 'x': array([0.00292362]), 'xaxis': 'x', - 'y': array(['zephyr-7b-beta'], dtype=object), + 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'RedPajama-INCITE Chat (7B)', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'zephyr-7b-beta', 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}}, - 'name': 'RedPajama-INCITE Chat (7B)', - 'offsetgroup': 'RedPajama-INCITE Chat (7B)', + 'name': 'zephyr-7b-beta', + 'offsetgroup': 'zephyr-7b-beta', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.05602848]), + 'x': array([0.00126128]), 'xaxis': 'x', - 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object), + 'y': array(['zephyr-7b-beta'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'Falcon Instruct (7B)', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'Mistral-7B-Instruct-v0.2', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, - 'name': 'Falcon Instruct (7B)', - 'offsetgroup': 'Falcon Instruct (7B)', + 'name': 'Mistral-7B-Instruct-v0.2', + 'offsetgroup': 'Mistral-7B-Instruct-v0.2', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.04906355]), + 'x': array([0.00056663]), 'xaxis': 'x', - 'y': array(['Falcon Instruct (7B)'], dtype=object), + 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', - 'legendgroup': 'Mistral-7B-Instruct-v0.2', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'legendgroup': 'RedPajama-INCITE Chat (7B)', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, - 'name': 'Mistral-7B-Instruct-v0.2', - 'offsetgroup': 'Mistral-7B-Instruct-v0.2', + 'name': 'RedPajama-INCITE Chat (7B)', + 'offsetgroup': 'RedPajama-INCITE Chat (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.04250631]), + 'x': array([0.]), 'xaxis': 'x', - 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object), + 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', 'legendgroup': 'Upstage SOLAR Instruct v1 (11B)', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, 'name': 'Upstage SOLAR Instruct v1 (11B)', @@ -1435,91 +1441,98 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00176623]), + 'x': array([0.]), 'xaxis': 'x', 'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object), 'yaxis': 'y'}], 'layout': {'barmode': 'relative', 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0}, 'template': '...', - 'title': {'text': 'Summary metrics original text length part'}, - 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'original text length part'}}, + 'title': {'text': 'Summary metrics BLEU score'}, + 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'BLEU score'}}, 'yaxis': {'anchor': 'x', 'categoryarray': [Upstage SOLAR Instruct v1 (11B), - Mistral-7B-Instruct-v0.2, Falcon - Instruct (7B), RedPajama-INCITE Chat - (7B), zephyr-7b-beta, - TinyLlama/TinyLlama-1.1B-Chat-v1.0, - chat-bison-32k (PaLM 2 32K), - Mixtral-8x7B-Instruct-v0.1, Vicuna v1.5 - (7B), WizardLM v1.2 (13B), chat-bison - (PaLM 2), gemini-pro, llama-2-70b-chat, - Qwen 1.5 Chat (7B), - OpenHermes-2.5-Mistral (7B), LLaMA-2 - Chat (7B), 01-ai Yi Chat (34B), Chronos - Hermes (13B), gpt-4, Mistral (7B) - Instruct v0.2 (Together AI), - gpt-4-turbo, gpt-3.5-turbo, Snorkel - Mistral PairRM DPO (7B)], + RedPajama-INCITE Chat (7B), + Mistral-7B-Instruct-v0.2, + zephyr-7b-beta, Snorkel Mistral PairRM + DPO (7B), Falcon Instruct (7B), + Mixtral-8x7B-Instruct-v0.1, gemini-pro, + TinyLlama/TinyLlama-1.1B-Chat-v1.0, Qwen + 1.5 Chat (7B), chat-bison-32k (PaLM 2 + 32K), WizardLM v1.2 (13B), chat-bison + (PaLM 2), gpt-4-turbo, LLaMA-2 Chat + (7B), llama-2-70b-chat, Mistral (7B) + Instruct v0.2 (Together AI), gpt-4, + OpenHermes-2.5-Mistral (7B), Vicuna v1.5 + (7B), 01-ai Yi Chat (34B), + gpt-3.5-turbo, Chronos Hermes (13B)], 
'categoryorder': 'array', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}}} -})",Summary metrics original text length part,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.7740234383755356],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.5905700146991734],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.5393220459796505],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 
(Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.5233998570385472],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4763731952669352],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4742810243835248],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.43251538287409536],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat 
(7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4084233313416049],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.312054520357568],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.29904529709475364],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.29684572894554634],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length 
part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.295286999418032],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2927236655934559],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.28716720161049375],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2781035051738079],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length 
part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2665288353398184],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2608806894318779],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.13915355617375091],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length 
part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.08796697338212889],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0560284823193376],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0490635544441649],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length 
part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.04250630683894714],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0017662349842492329],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlin
ewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",
""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""
strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin
"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""original text length part""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""Falcon Instruct (7B)"",""RedPajama-INCITE Chat (7B)"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison-32k (PaLM 2 32K)"",""Mixtral-8x7B-Instruct-v0.1"",""Vicuna v1.5 (7B)"",""WizardLM v1.2 (13B)"",""chat-bison (PaLM 2)"",""gemini-pro"",""llama-2-70b-chat"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""LLaMA-2 Chat (7B)"",""01-ai Yi Chat (34B)"",""Chronos Hermes (13B)"",""gpt-4"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-3.5-turbo"",""Snorkel Mistral PairRM DPO (7B)""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics original text length part""},""barmode"":""relative""}}","How long is the summarization compared to the original text, calculated as: `len(summarized_text) 
+ 1 / len(original_text) + 1`. Value is averaged for each model.",",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score -10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987 -18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592 -20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464 -4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351 -19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337 -1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395 -0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339 -3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306 -7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231 -8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172 -21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284 -17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664 -15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363 -14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015 -13,Vicuna v1.5 
(7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228 -6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283 -16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325 -11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842 -22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574 -9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0 -2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395 -5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363 -12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0 -","{""x"": ""original_text_length_part"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""original_text_length_part"": ""original text length part"", ""model"": ""Model""}, ""title"": ""Summary metrics original text length part""}" +})",Summary metrics BLEU score,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.011542047908319874],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU 
score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.00919205486407126],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.007428840277380581],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.007105541953090669],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0068684572027745494],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU 
score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.005711113295666468],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.005650224193975447],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.004560500754935232],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.004415024709996126],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU 
score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0042830628392272],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0037652345768886663],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.00373442128604677],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.003694633514634998],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU 
score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0033327500620805805],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.003286423403673119],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0032373504004405487],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU 
score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0031843990217988536],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0030232447024239606],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0029236226777824676],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU 
score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0012612839176470308],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.000566625796313851],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 
(11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},
""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scatterma
pbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""
],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y""
,""domain"":[0.0,1.0],""title"":{""text"":""BLEU score""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""RedPajama-INCITE Chat (7B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""Snorkel Mistral PairRM DPO (7B)"",""Falcon Instruct (7B)"",""Mixtral-8x7B-Instruct-v0.1"",""gemini-pro"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Qwen 1.5 Chat (7B)"",""chat-bison-32k (PaLM 2 32K)"",""WizardLM v1.2 (13B)"",""chat-bison (PaLM 2)"",""gpt-4-turbo"",""LLaMA-2 Chat (7B)"",""llama-2-70b-chat"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4"",""OpenHermes-2.5-Mistral (7B)"",""Vicuna v1.5 (7B)"",""01-ai Yi Chat (34B)"",""gpt-3.5-turbo"",""Chronos Hermes (13B)""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BLEU score""},""barmode"":""relative""}}"," + BLEU (BiLingual Evaluation Understudy) measures similarity between n-grams + (contiguous sequences of n words) in the generated and reference texts, + considering brevity penalties and length normalization.
+ For reference texts we used reference summarizations from the dataset, article title and original article text.
+ Maximum n-gram size was set to 3. Unlike BERT score this metric doesn't handle synonyms, semantic nuance and context. + + More about this metric can be read here: [link](https://aclanthology.org/P02-1040.pdf).
+ Higher score indicates better alignment between the generated and reference text. The value is averaged for each model.",",model,BERT_score_precision,BERT_score_recall,BERT_score_F1,BLEU_score,original_text_length_part,sentence_count,length_penalty +1,Chronos Hermes (13B),0.31285536,0.32630467,0.3150877,0.011542047908319874,0.4742810243835248,3.5818443804034583,14928.0 +18,gpt-3.5-turbo,0.49478123,0.50445867,0.49331823,0.00919205486407126,0.5905700146991734,4.229639819909955,89814.0 +0,01-ai Yi Chat (34B),0.33981326,0.35219854,0.34183535,0.007428840277380581,0.43251538287409536,3.5818443804034583,14928.0 +13,Vicuna v1.5 (7B),0.28434175,0.29119453,0.2839047,0.007105541953090669,0.2781035051738079,3.6173027989821884,16948.0 +7,OpenHermes-2.5-Mistral (7B),0.3621834,0.3685358,0.36003792,0.0068684572027745494,0.312054520357568,3.5818443804034583,14928.0 +19,gpt-4,0.4864653,0.49512562,0.4839312,0.005711113295666468,0.4763731952669352,4.266137566137566,85120.0 +4,Mistral (7B) Instruct v0.2 (Together AI),0.36488953,0.3797993,0.36758336,0.005650224193975447,0.5233998570385472,3.712222222222222,29298.0 +21,llama-2-70b-chat,0.20810011,0.22406381,0.21268094,0.004560500754935232,0.29684572894554634,4.2436893203883495,88008.0 +3,LLaMA-2 Chat (7B),0.32074162,0.33171847,0.32136682,0.004415024709996126,0.4084233313416049,3.5818443804034583,14928.0 +20,gpt-4-turbo,0.42933634,0.4414623,0.4294052,0.0042830628392272,0.5393220459796505,4.266137566137566,85120.0 +15,chat-bison (PaLM 2),0.23123139,0.24001649,0.23214735,0.0037652345768886663,0.2927236655934559,4.281081081081081,83400.0 +14,WizardLM v1.2 (13B),0.3420949,0.34746957,0.33996373,0.00373442128604677,0.28716720161049375,3.5818443804034583,14928.0 +16,chat-bison-32k (PaLM 2 32K),0.23051436,0.23993237,0.2317056,0.003694633514634998,0.2608806894318779,4.281081081081081,83400.0 +8,Qwen 1.5 Chat (7B),0.34898603,0.35945317,0.34867778,0.0033327500620805805,0.29904529709475364,3.5818443804034583,14928.0 
+11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122332305,0.12540509,0.12200464,0.003286423403673119,0.13915355617375091,4.244871794871795,87700.0 +17,gemini-pro,0.23109974,0.23956373,0.23199782,0.0032373504004405487,0.295286999418032,4.244871794871795,87700.0 +6,Mixtral-8x7B-Instruct-v0.1,0.19137934,0.2029136,0.19449018,0.0031843990217988536,0.2665288353398184,4.161038961038961,103320.0 +2,Falcon Instruct (7B),0.30270517,0.28607234,0.29104736,0.0030232447024239606,0.0490635544441649,3.5818443804034583,14928.0 +10,Snorkel Mistral PairRM DPO (7B),0.3167385,0.34785262,0.32718164,0.0029236226777824676,3.7740234383755356,3.5818443804034583,14928.0 +22,zephyr-7b-beta,0.085546724,0.08755772,0.085219756,0.0012612839176470308,0.08796697338212889,4.159788702026735,103714.0 +5,Mistral-7B-Instruct-v0.2,0.04389399,0.045185987,0.04378006,0.000566625796313851,0.04250630683894714,4.120342654588421,113258.0 +9,RedPajama-INCITE Chat (7B),0.26832756,0.27305293,0.26768887,0.0,0.0560284823193376,3.5818443804034583,14928.0 +12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0 +","{""x"": ""BLEU_score"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""BLEU_score"": ""BLEU score"", ""model"": ""Model""}, ""title"": ""Summary metrics BLEU score""}" "Figure({ 'data': [{'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'chat-bison (PaLM 2)', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, - 'name': 'chat-bison (PaLM 2)', - 'offsetgroup': 'chat-bison (PaLM 2)', + 'name': 'Snorkel Mistral PairRM DPO (7B)', + 'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([4.28108108]), + 'x': array([3.77402344]), 'xaxis': 'x', - 'y': array(['chat-bison (PaLM 2)'], dtype=object), + 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'chat-bison-32k (PaLM 2 32K)', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'gpt-3.5-turbo', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, - 'name': 'chat-bison-32k (PaLM 2 32K)', - 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)', + 'name': 'gpt-3.5-turbo', + 'offsetgroup': 'gpt-3.5-turbo', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([4.28108108]), + 'x': array([0.59057001]), 'xaxis': 'x', - 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object), + 'y': array(['gpt-3.5-turbo'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', 'legendgroup': 'gpt-4-turbo', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, 'name': 'gpt-4-turbo', @@ -1528,278 +1541,278 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([4.26613757]), + 'x': array([0.53932205]), 'xaxis': 'x', 'y': array(['gpt-4-turbo'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'gpt-4', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)', 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}}, - 'name': 'gpt-4', - 'offsetgroup': 'gpt-4', + 'name': 'Mistral (7B) Instruct v0.2 (Together AI)', + 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([4.26613757]), + 'x': array([0.52339986]), 'xaxis': 'x', - 'y': array(['gpt-4'], dtype=object), + 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'gemini-pro', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'gpt-4', 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}}, - 'name': 'gemini-pro', - 'offsetgroup': 'gemini-pro', + 'name': 'gpt-4', + 'offsetgroup': 'gpt-4', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([4.24487179]), + 'x': array([0.4763732]), 'xaxis': 'x', - 'y': array(['gemini-pro'], dtype=object), + 'y': array(['gpt-4'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'Chronos Hermes (13B)', 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}}, - 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', - 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', + 'name': 'Chronos Hermes (13B)', + 'offsetgroup': 'Chronos Hermes (13B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([4.24487179]), + 'x': array([0.47428102]), 'xaxis': 'x', - 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object), + 'y': array(['Chronos Hermes (13B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'llama-2-70b-chat', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': '01-ai Yi Chat (34B)', 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}}, - 'name': 'llama-2-70b-chat', - 'offsetgroup': 'llama-2-70b-chat', + 'name': '01-ai Yi Chat (34B)', + 'offsetgroup': '01-ai Yi Chat (34B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([4.24368932]), + 'x': array([0.43251538]), 'xaxis': 'x', - 'y': array(['llama-2-70b-chat'], dtype=object), + 'y': array(['01-ai Yi Chat (34B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'gpt-3.5-turbo', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'LLaMA-2 Chat (7B)', 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}}, - 'name': 'gpt-3.5-turbo', - 'offsetgroup': 'gpt-3.5-turbo', + 'name': 'LLaMA-2 Chat (7B)', + 'offsetgroup': 'LLaMA-2 Chat (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([4.22963982]), + 'x': array([0.40842333]), 'xaxis': 'x', - 'y': array(['gpt-3.5-turbo'], dtype=object), + 'y': array(['LLaMA-2 Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'OpenHermes-2.5-Mistral (7B)', 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}}, - 'name': 'Mixtral-8x7B-Instruct-v0.1', - 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1', + 'name': 'OpenHermes-2.5-Mistral (7B)', + 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([4.16103896]), + 'x': array([0.31205452]), 'xaxis': 'x', - 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object), + 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'zephyr-7b-beta', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'Qwen 1.5 Chat (7B)', 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}}, - 'name': 'zephyr-7b-beta', - 'offsetgroup': 'zephyr-7b-beta', + 'name': 'Qwen 1.5 Chat (7B)', + 'offsetgroup': 'Qwen 1.5 Chat (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([4.1597887]), + 'x': array([0.2990453]), 'xaxis': 'x', - 'y': array(['zephyr-7b-beta'], dtype=object), + 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'Mistral-7B-Instruct-v0.2', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'llama-2-70b-chat', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, - 'name': 'Mistral-7B-Instruct-v0.2', - 'offsetgroup': 'Mistral-7B-Instruct-v0.2', + 'name': 'llama-2-70b-chat', + 'offsetgroup': 'llama-2-70b-chat', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([4.12034265]), + 'x': array([0.29684573]), 'xaxis': 'x', - 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object), + 'y': array(['llama-2-70b-chat'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'gemini-pro', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, - 'name': 'Mistral (7B) Instruct v0.2 (Together AI)', - 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)', + 'name': 'gemini-pro', + 'offsetgroup': 'gemini-pro', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([3.71222222]), + 'x': array([0.295287]), 'xaxis': 'x', - 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object), + 'y': array(['gemini-pro'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'Vicuna v1.5 (7B)', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'chat-bison (PaLM 2)', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, - 'name': 'Vicuna v1.5 (7B)', - 'offsetgroup': 'Vicuna v1.5 (7B)', + 'name': 'chat-bison (PaLM 2)', + 'offsetgroup': 'chat-bison (PaLM 2)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([3.6173028]), + 'x': array([0.29272367]), 'xaxis': 'x', - 'y': array(['Vicuna v1.5 (7B)'], dtype=object), + 'y': array(['chat-bison (PaLM 2)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'Falcon Instruct (7B)', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'WizardLM v1.2 (13B)', 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}}, - 'name': 'Falcon Instruct (7B)', - 'offsetgroup': 'Falcon Instruct (7B)', + 'name': 'WizardLM v1.2 (13B)', + 'offsetgroup': 'WizardLM v1.2 (13B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([3.58184438]), + 'x': array([0.2871672]), 'xaxis': 'x', - 'y': array(['Falcon Instruct (7B)'], dtype=object), + 'y': array(['WizardLM v1.2 (13B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'RedPajama-INCITE Chat (7B)', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'Vicuna v1.5 (7B)', 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}}, - 'name': 'RedPajama-INCITE Chat (7B)', - 'offsetgroup': 'RedPajama-INCITE Chat (7B)', + 'name': 'Vicuna v1.5 (7B)', + 'offsetgroup': 'Vicuna v1.5 (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([3.58184438]), + 'x': array([0.27810351]), 'xaxis': 'x', - 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object), + 'y': array(['Vicuna v1.5 (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1', 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}}, - 'name': 'Snorkel Mistral PairRM DPO (7B)', - 'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)', + 'name': 'Mixtral-8x7B-Instruct-v0.1', + 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([3.58184438]), + 'x': array([0.26652884]), 'xaxis': 'x', - 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object), + 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'WizardLM v1.2 (13B)', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'chat-bison-32k (PaLM 2 32K)', 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}}, - 'name': 'WizardLM v1.2 (13B)', - 'offsetgroup': 'WizardLM v1.2 (13B)', + 'name': 'chat-bison-32k (PaLM 2 32K)', + 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([3.58184438]), + 'x': array([0.26088069]), 'xaxis': 'x', - 'y': array(['WizardLM v1.2 (13B)'], dtype=object), + 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'Qwen 1.5 Chat (7B)', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}}, - 'name': 'Qwen 1.5 Chat (7B)', - 'offsetgroup': 'Qwen 1.5 Chat (7B)', + 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', + 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([3.58184438]), + 'x': array([0.13915356]), 'xaxis': 'x', - 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object), + 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'OpenHermes-2.5-Mistral (7B)', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'zephyr-7b-beta', 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}}, - 'name': 'OpenHermes-2.5-Mistral (7B)', - 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)', + 'name': 'zephyr-7b-beta', + 'offsetgroup': 'zephyr-7b-beta', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([3.58184438]), + 'x': array([0.08796697]), 'xaxis': 'x', - 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object), + 'y': array(['zephyr-7b-beta'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'LLaMA-2 Chat (7B)', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'RedPajama-INCITE Chat (7B)', 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}}, - 'name': 'LLaMA-2 Chat (7B)', - 'offsetgroup': 'LLaMA-2 Chat (7B)', + 'name': 'RedPajama-INCITE Chat (7B)', + 'offsetgroup': 'RedPajama-INCITE Chat (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([3.58184438]), + 'x': array([0.05602848]), 'xaxis': 'x', - 'y': array(['LLaMA-2 Chat (7B)'], dtype=object), + 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': '01-ai Yi Chat (34B)', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'Falcon Instruct (7B)', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, - 'name': '01-ai Yi Chat (34B)', - 'offsetgroup': '01-ai Yi Chat (34B)', + 'name': 'Falcon Instruct (7B)', + 'offsetgroup': 'Falcon Instruct (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([3.58184438]), + 'x': array([0.04906355]), 'xaxis': 'x', - 'y': array(['01-ai Yi Chat (34B)'], dtype=object), + 'y': array(['Falcon Instruct (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', - 'legendgroup': 'Chronos Hermes (13B)', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', + 'legendgroup': 'Mistral-7B-Instruct-v0.2', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, - 'name': 'Chronos Hermes (13B)', - 'offsetgroup': 'Chronos Hermes (13B)', + 'name': 'Mistral-7B-Instruct-v0.2', + 'offsetgroup': 'Mistral-7B-Instruct-v0.2', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([3.58184438]), + 'x': array([0.04250631]), 'xaxis': 'x', - 'y': array(['Chronos Hermes (13B)'], dtype=object), + 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
sentence count=%{x}', + 'hovertemplate': 'Model=%{y}
original text length part=%{x}', 'legendgroup': 'Upstage SOLAR Instruct v1 (11B)', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, 'name': 'Upstage SOLAR Instruct v1 (11B)', @@ -1808,218 +1821,221 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([3.58184438]), + 'x': array([0.00176623]), 'xaxis': 'x', 'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object), 'yaxis': 'y'}], 'layout': {'barmode': 'relative', 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0}, 'template': '...', - 'title': {'text': 'Summary metrics sentence count'}, - 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'sentence count'}}, + 'title': {'text': 'Summary metrics original text length part'}, + 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'original text length part'}}, 'yaxis': {'anchor': 'x', 'categoryarray': [Upstage SOLAR Instruct v1 (11B), - Chronos Hermes (13B), 01-ai Yi Chat - (34B), LLaMA-2 Chat (7B), - OpenHermes-2.5-Mistral (7B), Qwen 1.5 - Chat (7B), WizardLM v1.2 (13B), Snorkel - Mistral PairRM DPO (7B), RedPajama- - INCITE Chat (7B), Falcon Instruct (7B), - Vicuna v1.5 (7B), Mistral (7B) Instruct - v0.2 (Together AI), - Mistral-7B-Instruct-v0.2, - zephyr-7b-beta, - Mixtral-8x7B-Instruct-v0.1, - gpt-3.5-turbo, llama-2-70b-chat, + Mistral-7B-Instruct-v0.2, Falcon + Instruct (7B), RedPajama-INCITE Chat + (7B), zephyr-7b-beta, TinyLlama/TinyLlama-1.1B-Chat-v1.0, - gemini-pro, gpt-4, gpt-4-turbo, chat- - bison-32k (PaLM 2 32K), chat-bison (PaLM - 2)], + chat-bison-32k (PaLM 2 32K), + Mixtral-8x7B-Instruct-v0.1, Vicuna v1.5 + (7B), WizardLM v1.2 (13B), chat-bison + (PaLM 2), gemini-pro, llama-2-70b-chat, + Qwen 1.5 Chat (7B), + OpenHermes-2.5-Mistral (7B), LLaMA-2 + Chat (7B), 01-ai Yi Chat (34B), Chronos + Hermes (13B), gpt-4, Mistral (7B) + Instruct v0.2 (Together AI), + gpt-4-turbo, gpt-3.5-turbo, Snorkel + Mistral PairRM DPO (7B)], 
'categoryorder': 'array', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}}} -})",Summary metrics sentence count,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.281081081081081],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.281081081081081],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.266137566137566],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence 
count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.266137566137566],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.244871794871795],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.244871794871795],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.2436893203883495],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence 
count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.229639819909955],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.161038961038961],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.159788702026735],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.120342654588421],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence 
count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.712222222222222],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.6173027989821884],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat 
(7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral 
(7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 
(11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type""
:""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{
""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar
"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""w
hite"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""sentence count""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Chronos Hermes (13B)"",""01-ai Yi Chat (34B)"",""LLaMA-2 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Qwen 1.5 Chat (7B)"",""WizardLM v1.2 (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""Mixtral-8x7B-Instruct-v0.1"",""gpt-3.5-turbo"",""llama-2-70b-chat"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""gemini-pro"",""gpt-4"",""gpt-4-turbo"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics sentence count""},""barmode"":""relative""}}",Average sentence count of the summary.,",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score -15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363 -16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325 -20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464 -19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337 -17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664 -11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842 
-21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284 -18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592 -6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283 -22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574 -5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363 -4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351 -13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228 -2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395 -9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0 -10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987 -14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015 -8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172 -7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231 -3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306 -0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339 -1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395 -12,Upstage 
SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0 -","{""x"": ""sentence_count"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""sentence_count"": ""sentence count"", ""model"": ""Model""}, ""title"": ""Summary metrics sentence count""}" +})",Summary metrics original text length part,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.7740234383755356],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.5905700146991734],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.5393220459796505],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length 
part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.5233998570385472],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4763731952669352],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4742810243835248],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.43251538287409536],""xaxis"":""x"",""y"":[""01-ai Yi Chat 
(34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4084233313416049],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.312054520357568],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.29904529709475364],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length 
part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.29684572894554634],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.295286999418032],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2927236655934559],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.28716720161049375],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length 
part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2781035051738079],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2665288353398184],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2608806894318779],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length 
part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.13915355617375091],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.08796697338212889],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0560284823193376],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0490635544441649],""xaxis"":""x"",""y"":[""Falcon Instruct 
(7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.04250630683894714],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eoriginal text length part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0017662349842492329],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 
(11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},
""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scatterma
pbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""
],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y""
,""domain"":[0.0,1.0],""title"":{""text"":""original text length part""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""Falcon Instruct (7B)"",""RedPajama-INCITE Chat (7B)"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison-32k (PaLM 2 32K)"",""Mixtral-8x7B-Instruct-v0.1"",""Vicuna v1.5 (7B)"",""WizardLM v1.2 (13B)"",""chat-bison (PaLM 2)"",""gemini-pro"",""llama-2-70b-chat"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""LLaMA-2 Chat (7B)"",""01-ai Yi Chat (34B)"",""Chronos Hermes (13B)"",""gpt-4"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-3.5-turbo"",""Snorkel Mistral PairRM DPO (7B)""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics original text length part""},""barmode"":""relative""}}","How long is the summarization compared to the original text, + calculated as: `len(summarized_text) + 1 / len(original_text) + 1`. + + The value is averaged for each model. 
+ ",",model,BERT_score_precision,BERT_score_recall,BERT_score_F1,BLEU_score,original_text_length_part,sentence_count,length_penalty +10,Snorkel Mistral PairRM DPO (7B),0.3167385,0.34785262,0.32718164,0.0029236226777824676,3.7740234383755356,3.5818443804034583,14928.0 +18,gpt-3.5-turbo,0.49478123,0.50445867,0.49331823,0.00919205486407126,0.5905700146991734,4.229639819909955,89814.0 +20,gpt-4-turbo,0.42933634,0.4414623,0.4294052,0.0042830628392272,0.5393220459796505,4.266137566137566,85120.0 +4,Mistral (7B) Instruct v0.2 (Together AI),0.36488953,0.3797993,0.36758336,0.005650224193975447,0.5233998570385472,3.712222222222222,29298.0 +19,gpt-4,0.4864653,0.49512562,0.4839312,0.005711113295666468,0.4763731952669352,4.266137566137566,85120.0 +1,Chronos Hermes (13B),0.31285536,0.32630467,0.3150877,0.011542047908319874,0.4742810243835248,3.5818443804034583,14928.0 +0,01-ai Yi Chat (34B),0.33981326,0.35219854,0.34183535,0.007428840277380581,0.43251538287409536,3.5818443804034583,14928.0 +3,LLaMA-2 Chat (7B),0.32074162,0.33171847,0.32136682,0.004415024709996126,0.4084233313416049,3.5818443804034583,14928.0 +7,OpenHermes-2.5-Mistral (7B),0.3621834,0.3685358,0.36003792,0.0068684572027745494,0.312054520357568,3.5818443804034583,14928.0 +8,Qwen 1.5 Chat (7B),0.34898603,0.35945317,0.34867778,0.0033327500620805805,0.29904529709475364,3.5818443804034583,14928.0 +21,llama-2-70b-chat,0.20810011,0.22406381,0.21268094,0.004560500754935232,0.29684572894554634,4.2436893203883495,88008.0 +17,gemini-pro,0.23109974,0.23956373,0.23199782,0.0032373504004405487,0.295286999418032,4.244871794871795,87700.0 +15,chat-bison (PaLM 2),0.23123139,0.24001649,0.23214735,0.0037652345768886663,0.2927236655934559,4.281081081081081,83400.0 +14,WizardLM v1.2 (13B),0.3420949,0.34746957,0.33996373,0.00373442128604677,0.28716720161049375,3.5818443804034583,14928.0 +13,Vicuna v1.5 (7B),0.28434175,0.29119453,0.2839047,0.007105541953090669,0.2781035051738079,3.6173027989821884,16948.0 
+6,Mixtral-8x7B-Instruct-v0.1,0.19137934,0.2029136,0.19449018,0.0031843990217988536,0.2665288353398184,4.161038961038961,103320.0 +16,chat-bison-32k (PaLM 2 32K),0.23051436,0.23993237,0.2317056,0.003694633514634998,0.2608806894318779,4.281081081081081,83400.0 +11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122332305,0.12540509,0.12200464,0.003286423403673119,0.13915355617375091,4.244871794871795,87700.0 +22,zephyr-7b-beta,0.085546724,0.08755772,0.085219756,0.0012612839176470308,0.08796697338212889,4.159788702026735,103714.0 +9,RedPajama-INCITE Chat (7B),0.26832756,0.27305293,0.26768887,0.0,0.0560284823193376,3.5818443804034583,14928.0 +2,Falcon Instruct (7B),0.30270517,0.28607234,0.29104736,0.0030232447024239606,0.0490635544441649,3.5818443804034583,14928.0 +5,Mistral-7B-Instruct-v0.2,0.04389399,0.045185987,0.04378006,0.000566625796313851,0.04250630683894714,4.120342654588421,113258.0 +12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0 +","{""x"": ""original_text_length_part"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""original_text_length_part"": ""original text length part"", ""model"": ""Model""}, ""title"": ""Summary metrics original text length part""}" "Figure({ 'data': [{'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', - 'legendgroup': 'Mistral-7B-Instruct-v0.2', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', + 'legendgroup': 'chat-bison (PaLM 2)', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, - 'name': 'Mistral-7B-Instruct-v0.2', - 'offsetgroup': 'Mistral-7B-Instruct-v0.2', + 'name': 'chat-bison (PaLM 2)', + 'offsetgroup': 'chat-bison (PaLM 2)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([113258.]), + 'x': array([4.28108108]), 'xaxis': 'x', - 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object), + 'y': array(['chat-bison (PaLM 2)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', - 'legendgroup': 'zephyr-7b-beta', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', + 'legendgroup': 'chat-bison-32k (PaLM 2 32K)', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, - 'name': 'zephyr-7b-beta', - 'offsetgroup': 'zephyr-7b-beta', + 'name': 'chat-bison-32k (PaLM 2 32K)', + 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([103714.]), + 'x': array([4.28108108]), 'xaxis': 'x', - 'y': array(['zephyr-7b-beta'], dtype=object), + 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', - 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', + 'legendgroup': 'gpt-4-turbo', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, - 'name': 'Mixtral-8x7B-Instruct-v0.1', - 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1', + 'name': 'gpt-4-turbo', + 'offsetgroup': 'gpt-4-turbo', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([103320.]), + 'x': array([4.26613757]), 'xaxis': 'x', - 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object), + 'y': array(['gpt-4-turbo'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', - 'legendgroup': 'gpt-3.5-turbo', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', + 'legendgroup': 'gpt-4', 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}}, - 'name': 'gpt-3.5-turbo', - 'offsetgroup': 'gpt-3.5-turbo', + 'name': 'gpt-4', + 'offsetgroup': 'gpt-4', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([89814.]), + 'x': array([4.26613757]), 'xaxis': 'x', - 'y': array(['gpt-3.5-turbo'], dtype=object), + 'y': array(['gpt-4'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', - 'legendgroup': 'llama-2-70b-chat', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', + 'legendgroup': 'gemini-pro', 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}}, - 'name': 'llama-2-70b-chat', - 'offsetgroup': 'llama-2-70b-chat', + 'name': 'gemini-pro', + 'offsetgroup': 'gemini-pro', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([88008.]), + 'x': array([4.24487179]), 'xaxis': 'x', - 'y': array(['llama-2-70b-chat'], dtype=object), + 'y': array(['gemini-pro'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', - 'legendgroup': 'gemini-pro', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', + 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}}, - 'name': 'gemini-pro', - 'offsetgroup': 'gemini-pro', + 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', + 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([87700.]), + 'x': array([4.24487179]), 'xaxis': 'x', - 'y': array(['gemini-pro'], dtype=object), + 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', - 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', + 'legendgroup': 'llama-2-70b-chat', 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}}, - 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', - 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', + 'name': 'llama-2-70b-chat', + 'offsetgroup': 'llama-2-70b-chat', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([87700.]), + 'x': array([4.24368932]), 'xaxis': 'x', - 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object), + 'y': array(['llama-2-70b-chat'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', - 'legendgroup': 'gpt-4-turbo', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', + 'legendgroup': 'gpt-3.5-turbo', 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}}, - 'name': 'gpt-4-turbo', - 'offsetgroup': 'gpt-4-turbo', + 'name': 'gpt-3.5-turbo', + 'offsetgroup': 'gpt-3.5-turbo', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([85120.]), + 'x': array([4.22963982]), 'xaxis': 'x', - 'y': array(['gpt-4-turbo'], dtype=object), + 'y': array(['gpt-3.5-turbo'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', - 'legendgroup': 'gpt-4', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', + 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1', 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}}, - 'name': 'gpt-4', - 'offsetgroup': 'gpt-4', + 'name': 'Mixtral-8x7B-Instruct-v0.1', + 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([85120.]), + 'x': array([4.16103896]), 'xaxis': 'x', - 'y': array(['gpt-4'], dtype=object), + 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', - 'legendgroup': 'chat-bison (PaLM 2)', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', + 'legendgroup': 'zephyr-7b-beta', 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}}, - 'name': 'chat-bison (PaLM 2)', - 'offsetgroup': 'chat-bison (PaLM 2)', + 'name': 'zephyr-7b-beta', + 'offsetgroup': 'zephyr-7b-beta', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([83400.]), + 'x': array([4.1597887]), 'xaxis': 'x', - 'y': array(['chat-bison (PaLM 2)'], dtype=object), + 'y': array(['zephyr-7b-beta'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', - 'legendgroup': 'chat-bison-32k (PaLM 2 32K)', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', + 'legendgroup': 'Mistral-7B-Instruct-v0.2', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, - 'name': 'chat-bison-32k (PaLM 2 32K)', - 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)', + 'name': 'Mistral-7B-Instruct-v0.2', + 'offsetgroup': 'Mistral-7B-Instruct-v0.2', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([83400.]), + 'x': array([4.12034265]), 'xaxis': 'x', - 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object), + 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, 'name': 'Mistral (7B) Instruct v0.2 (Together AI)', @@ -2028,12 +2044,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([29298.]), + 'x': array([3.71222222]), 'xaxis': 'x', 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', 'legendgroup': 'Vicuna v1.5 (7B)', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, 'name': 'Vicuna v1.5 (7B)', @@ -2042,12 +2058,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([16948.]), + 'x': array([3.6173028]), 'xaxis': 'x', 'y': array(['Vicuna v1.5 (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', 'legendgroup': 'Falcon Instruct (7B)', 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}}, 'name': 'Falcon Instruct (7B)', @@ -2056,12 +2072,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([14928.]), + 'x': array([3.58184438]), 'xaxis': 'x', 'y': array(['Falcon Instruct (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', 'legendgroup': 'RedPajama-INCITE Chat (7B)', 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}}, 'name': 'RedPajama-INCITE Chat (7B)', @@ -2070,12 +2086,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([14928.]), + 'x': array([3.58184438]), 'xaxis': 'x', 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)', 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}}, 'name': 'Snorkel Mistral PairRM DPO (7B)', @@ -2084,12 +2100,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([14928.]), + 'x': array([3.58184438]), 'xaxis': 'x', 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', 'legendgroup': 'WizardLM v1.2 (13B)', 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}}, 'name': 'WizardLM v1.2 (13B)', @@ -2098,12 +2114,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([14928.]), + 'x': array([3.58184438]), 'xaxis': 'x', 'y': array(['WizardLM v1.2 (13B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', 'legendgroup': 'Qwen 1.5 Chat (7B)', 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}}, 'name': 'Qwen 1.5 Chat (7B)', @@ -2112,12 +2128,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([14928.]), + 'x': array([3.58184438]), 'xaxis': 'x', 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', 'legendgroup': 'OpenHermes-2.5-Mistral (7B)', 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}}, 'name': 'OpenHermes-2.5-Mistral (7B)', @@ -2126,12 +2142,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([14928.]), + 'x': array([3.58184438]), 'xaxis': 'x', 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', 'legendgroup': 'LLaMA-2 Chat (7B)', 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}}, 'name': 'LLaMA-2 Chat (7B)', @@ -2140,12 +2156,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([14928.]), + 'x': array([3.58184438]), 'xaxis': 'x', 'y': array(['LLaMA-2 Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', 'legendgroup': '01-ai Yi Chat (34B)', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, 'name': '01-ai Yi Chat (34B)', @@ -2154,12 +2170,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([14928.]), + 'x': array([3.58184438]), 'xaxis': 'x', 'y': array(['01-ai Yi Chat (34B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', 'legendgroup': 'Chronos Hermes (13B)', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, 'name': 'Chronos Hermes (13B)', @@ -2168,12 +2184,12 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([14928.]), + 'x': array([3.58184438]), 'xaxis': 'x', 'y': array(['Chronos Hermes (13B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'hovertemplate': 'Model=%{y}
sentence count=%{x}', 'legendgroup': 'Upstage SOLAR Instruct v1 (11B)', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, 'name': 'Upstage SOLAR Instruct v1 (11B)', @@ -2182,15 +2198,15 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([14928.]), + 'x': array([3.58184438]), 'xaxis': 'x', 'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object), 'yaxis': 'y'}], 'layout': {'barmode': 'relative', 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0}, 'template': '...', - 'title': {'text': 'Summary metrics length penalty'}, - 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'length penalty'}}, + 'title': {'text': 'Summary metrics sentence count'}, + 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'sentence count'}}, 'yaxis': {'anchor': 'x', 'categoryarray': [Upstage SOLAR Instruct v1 (11B), Chronos Hermes (13B), 01-ai Yi Chat @@ -2200,256 +2216,256 @@ plot_object,header,plot_json,description,df,arguments Mistral PairRM DPO (7B), RedPajama- INCITE Chat (7B), Falcon Instruct (7B), Vicuna v1.5 (7B), Mistral (7B) Instruct - v0.2 (Together AI), chat-bison-32k (PaLM - 2 32K), chat-bison (PaLM 2), gpt-4, - gpt-4-turbo, - TinyLlama/TinyLlama-1.1B-Chat-v1.0, - gemini-pro, llama-2-70b-chat, - gpt-3.5-turbo, - Mixtral-8x7B-Instruct-v0.1, + v0.2 (Together AI), + Mistral-7B-Instruct-v0.2, zephyr-7b-beta, - Mistral-7B-Instruct-v0.2], + Mixtral-8x7B-Instruct-v0.1, + gpt-3.5-turbo, llama-2-70b-chat, + TinyLlama/TinyLlama-1.1B-Chat-v1.0, + gemini-pro, gpt-4, gpt-4-turbo, chat- + bison-32k (PaLM 2 32K), chat-bison (PaLM + 2)], 'categoryorder': 'array', 'domain': [0.0, 1.0], 'title': {'text': 'Model'}}} -})",Summary metrics length penalty,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength 
penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[113258.0],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[103714.0],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[103320.0],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[89814.0],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength 
penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[88008.0],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[87700.0],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[87700.0],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[85120.0],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength 
penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[85120.0],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[83400.0],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[83400.0],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[29298.0],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength 
penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[16948.0],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength 
penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength 
penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 
(11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},
""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scatterma
pbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""
],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y""
,""domain"":[0.0,1.0],""title"":{""text"":""length penalty""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Chronos Hermes (13B)"",""01-ai Yi Chat (34B)"",""LLaMA-2 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Qwen 1.5 Chat (7B)"",""WizardLM v1.2 (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)"",""gpt-4"",""gpt-4-turbo"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""gemini-pro"",""llama-2-70b-chat"",""gpt-3.5-turbo"",""Mixtral-8x7B-Instruct-v0.1"",""zephyr-7b-beta"",""Mistral-7B-Instruct-v0.2""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics length penalty""},""barmode"":""relative""}}",It is assumed that good quality summary contains between 2 and 5 sentences (inclusive range). The penalty is a difference between summary sentence count and this range. 
It is summed for each model.,",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score -5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363 -22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574 -6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283 -18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592 -21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284 -17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664 -11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842 -20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464 -19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337 -15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363 -16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325 -4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351 -13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228 -2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395 -9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0 
-10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987 -14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015 -8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172 -7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231 -3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306 -0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339 -1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395 -12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0 -","{""x"": ""length_penalty"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""length_penalty"": ""length penalty"", ""model"": ""Model""}, ""title"": ""Summary metrics length penalty""}" +})",Summary metrics sentence count,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.281081081081081],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 
32K)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.281081081081081],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.266137566137566],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.266137566137566],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.244871794871795],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence 
count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.244871794871795],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.2436893203883495],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.229639819909955],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence 
count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.161038961038961],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.159788702026735],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.120342654588421],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.712222222222222],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together 
AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.6173027989821884],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO 
(7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat 
(7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003esentence count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 
(11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},
""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scatterma
pbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""
],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y""
,""domain"":[0.0,1.0],""title"":{""text"":""sentence count""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Chronos Hermes (13B)"",""01-ai Yi Chat (34B)"",""LLaMA-2 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Qwen 1.5 Chat (7B)"",""WizardLM v1.2 (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""Mixtral-8x7B-Instruct-v0.1"",""gpt-3.5-turbo"",""llama-2-70b-chat"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""gemini-pro"",""gpt-4"",""gpt-4-turbo"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics sentence count""},""barmode"":""relative""}}",Average sentence count of the summary.,",model,BERT_score_precision,BERT_score_recall,BERT_score_F1,BLEU_score,original_text_length_part,sentence_count,length_penalty +15,chat-bison (PaLM 2),0.23123139,0.24001649,0.23214735,0.0037652345768886663,0.2927236655934559,4.281081081081081,83400.0 +16,chat-bison-32k (PaLM 2 32K),0.23051436,0.23993237,0.2317056,0.003694633514634998,0.2608806894318779,4.281081081081081,83400.0 +20,gpt-4-turbo,0.42933634,0.4414623,0.4294052,0.0042830628392272,0.5393220459796505,4.266137566137566,85120.0 +19,gpt-4,0.4864653,0.49512562,0.4839312,0.005711113295666468,0.4763731952669352,4.266137566137566,85120.0 +17,gemini-pro,0.23109974,0.23956373,0.23199782,0.0032373504004405487,0.295286999418032,4.244871794871795,87700.0 +11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122332305,0.12540509,0.12200464,0.003286423403673119,0.13915355617375091,4.244871794871795,87700.0 +21,llama-2-70b-chat,0.20810011,0.22406381,0.21268094,0.004560500754935232,0.29684572894554634,4.2436893203883495,88008.0 
+18,gpt-3.5-turbo,0.49478123,0.50445867,0.49331823,0.00919205486407126,0.5905700146991734,4.229639819909955,89814.0 +6,Mixtral-8x7B-Instruct-v0.1,0.19137934,0.2029136,0.19449018,0.0031843990217988536,0.2665288353398184,4.161038961038961,103320.0 +22,zephyr-7b-beta,0.085546724,0.08755772,0.085219756,0.0012612839176470308,0.08796697338212889,4.159788702026735,103714.0 +5,Mistral-7B-Instruct-v0.2,0.04389399,0.045185987,0.04378006,0.000566625796313851,0.04250630683894714,4.120342654588421,113258.0 +4,Mistral (7B) Instruct v0.2 (Together AI),0.36488953,0.3797993,0.36758336,0.005650224193975447,0.5233998570385472,3.712222222222222,29298.0 +13,Vicuna v1.5 (7B),0.28434175,0.29119453,0.2839047,0.007105541953090669,0.2781035051738079,3.6173027989821884,16948.0 +2,Falcon Instruct (7B),0.30270517,0.28607234,0.29104736,0.0030232447024239606,0.0490635544441649,3.5818443804034583,14928.0 +9,RedPajama-INCITE Chat (7B),0.26832756,0.27305293,0.26768887,0.0,0.0560284823193376,3.5818443804034583,14928.0 +10,Snorkel Mistral PairRM DPO (7B),0.3167385,0.34785262,0.32718164,0.0029236226777824676,3.7740234383755356,3.5818443804034583,14928.0 +14,WizardLM v1.2 (13B),0.3420949,0.34746957,0.33996373,0.00373442128604677,0.28716720161049375,3.5818443804034583,14928.0 +8,Qwen 1.5 Chat (7B),0.34898603,0.35945317,0.34867778,0.0033327500620805805,0.29904529709475364,3.5818443804034583,14928.0 +7,OpenHermes-2.5-Mistral (7B),0.3621834,0.3685358,0.36003792,0.0068684572027745494,0.312054520357568,3.5818443804034583,14928.0 +3,LLaMA-2 Chat (7B),0.32074162,0.33171847,0.32136682,0.004415024709996126,0.4084233313416049,3.5818443804034583,14928.0 +0,01-ai Yi Chat (34B),0.33981326,0.35219854,0.34183535,0.007428840277380581,0.43251538287409536,3.5818443804034583,14928.0 +1,Chronos Hermes (13B),0.31285536,0.32630467,0.3150877,0.011542047908319874,0.4742810243835248,3.5818443804034583,14928.0 +12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0 +","{""x"": 
""sentence_count"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""sentence_count"": ""sentence count"", ""model"": ""Model""}, ""title"": ""Summary metrics sentence count""}" "Figure({ 'data': [{'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'Chronos Hermes (13B)', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'Mistral-7B-Instruct-v0.2', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, - 'name': 'Chronos Hermes (13B)', - 'offsetgroup': 'Chronos Hermes (13B)', + 'name': 'Mistral-7B-Instruct-v0.2', + 'offsetgroup': 'Mistral-7B-Instruct-v0.2', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.01143901]), + 'x': array([113258.]), 'xaxis': 'x', - 'y': array(['Chronos Hermes (13B)'], dtype=object), + 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'gpt-3.5-turbo', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'zephyr-7b-beta', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, - 'name': 'gpt-3.5-turbo', - 'offsetgroup': 'gpt-3.5-turbo', + 'name': 'zephyr-7b-beta', + 'offsetgroup': 'zephyr-7b-beta', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00789245]), + 'x': array([103714.]), 'xaxis': 'x', - 'y': array(['gpt-3.5-turbo'], dtype=object), + 'y': array(['zephyr-7b-beta'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': '01-ai Yi Chat (34B)', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, - 'name': '01-ai Yi Chat (34B)', - 'offsetgroup': '01-ai Yi Chat (34B)', + 'name': 'Mixtral-8x7B-Instruct-v0.1', + 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00731157]), + 'x': array([103320.]), 'xaxis': 'x', - 'y': array(['01-ai Yi Chat (34B)'], dtype=object), + 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'Vicuna v1.5 (7B)', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'gpt-3.5-turbo', 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}}, - 'name': 'Vicuna v1.5 (7B)', - 'offsetgroup': 'Vicuna v1.5 (7B)', + 'name': 'gpt-3.5-turbo', + 'offsetgroup': 'gpt-3.5-turbo', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00695233]), + 'x': array([89814.]), 'xaxis': 'x', - 'y': array(['Vicuna v1.5 (7B)'], dtype=object), + 'y': array(['gpt-3.5-turbo'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'OpenHermes-2.5-Mistral (7B)', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'llama-2-70b-chat', 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}}, - 'name': 'OpenHermes-2.5-Mistral (7B)', - 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)', + 'name': 'llama-2-70b-chat', + 'offsetgroup': 'llama-2-70b-chat', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00656316]), + 'x': array([88008.]), 'xaxis': 'x', - 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object), + 'y': array(['llama-2-70b-chat'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'gemini-pro', 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}}, - 'name': 'Mistral (7B) Instruct v0.2 (Together AI)', - 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)', + 'name': 'gemini-pro', + 'offsetgroup': 'gemini-pro', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00547852]), + 'x': array([87700.]), 'xaxis': 'x', - 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object), + 'y': array(['gemini-pro'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'gpt-4', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}}, - 'name': 'gpt-4', - 'offsetgroup': 'gpt-4', + 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', + 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00470457]), + 'x': array([87700.]), 'xaxis': 'x', - 'y': array(['gpt-4'], dtype=object), + 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'LLaMA-2 Chat (7B)', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'gpt-4-turbo', 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}}, - 'name': 'LLaMA-2 Chat (7B)', - 'offsetgroup': 'LLaMA-2 Chat (7B)', + 'name': 'gpt-4-turbo', + 'offsetgroup': 'gpt-4-turbo', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00425586]), + 'x': array([85120.]), 'xaxis': 'x', - 'y': array(['LLaMA-2 Chat (7B)'], dtype=object), + 'y': array(['gpt-4-turbo'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'WizardLM v1.2 (13B)', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'gpt-4', 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}}, - 'name': 'WizardLM v1.2 (13B)', - 'offsetgroup': 'WizardLM v1.2 (13B)', + 'name': 'gpt-4', + 'offsetgroup': 'gpt-4', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00367138]), + 'x': array([85120.]), 'xaxis': 'x', - 'y': array(['WizardLM v1.2 (13B)'], dtype=object), + 'y': array(['gpt-4'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'gpt-4-turbo', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'chat-bison (PaLM 2)', 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}}, - 'name': 'gpt-4-turbo', - 'offsetgroup': 'gpt-4-turbo', + 'name': 'chat-bison (PaLM 2)', + 'offsetgroup': 'chat-bison (PaLM 2)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00348737]), + 'x': array([83400.]), 'xaxis': 'x', - 'y': array(['gpt-4-turbo'], dtype=object), + 'y': array(['chat-bison (PaLM 2)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'chat-bison (PaLM 2)', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'chat-bison-32k (PaLM 2 32K)', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, - 'name': 'chat-bison (PaLM 2)', - 'offsetgroup': 'chat-bison (PaLM 2)', + 'name': 'chat-bison-32k (PaLM 2 32K)', + 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00331735]), + 'x': array([83400.]), 'xaxis': 'x', - 'y': array(['chat-bison (PaLM 2)'], dtype=object), + 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'llama-2-70b-chat', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, - 'name': 'llama-2-70b-chat', - 'offsetgroup': 'llama-2-70b-chat', + 'name': 'Mistral (7B) Instruct v0.2 (Together AI)', + 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00329426]), + 'x': array([29298.]), 'xaxis': 'x', - 'y': array(['llama-2-70b-chat'], dtype=object), + 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'Qwen 1.5 Chat (7B)', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'Vicuna v1.5 (7B)', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, - 'name': 'Qwen 1.5 Chat (7B)', - 'offsetgroup': 'Qwen 1.5 Chat (7B)', + 'name': 'Vicuna v1.5 (7B)', + 'offsetgroup': 'Vicuna v1.5 (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00318557]), + 'x': array([16948.]), 'xaxis': 'x', - 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object), + 'y': array(['Vicuna v1.5 (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'Falcon Instruct (7B)', 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}}, - 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', - 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0', + 'name': 'Falcon Instruct (7B)', + 'offsetgroup': 'Falcon Instruct (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00299116]), + 'x': array([14928.]), 'xaxis': 'x', - 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object), + 'y': array(['Falcon Instruct (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'chat-bison-32k (PaLM 2 32K)', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'RedPajama-INCITE Chat (7B)', 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}}, - 'name': 'chat-bison-32k (PaLM 2 32K)', - 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)', + 'name': 'RedPajama-INCITE Chat (7B)', + 'offsetgroup': 'RedPajama-INCITE Chat (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00297091]), + 'x': array([14928.]), 'xaxis': 'x', - 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object), + 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)', 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}}, 'name': 'Snorkel Mistral PairRM DPO (7B)', @@ -2458,96 +2474,96 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.0029079]), + 'x': array([14928.]), 'xaxis': 'x', 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'WizardLM v1.2 (13B)', 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}}, - 'name': 'Mixtral-8x7B-Instruct-v0.1', - 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1', + 'name': 'WizardLM v1.2 (13B)', + 'offsetgroup': 'WizardLM v1.2 (13B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00268393]), + 'x': array([14928.]), 'xaxis': 'x', - 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object), + 'y': array(['WizardLM v1.2 (13B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'gemini-pro', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'Qwen 1.5 Chat (7B)', 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}}, - 'name': 'gemini-pro', - 'offsetgroup': 'gemini-pro', + 'name': 'Qwen 1.5 Chat (7B)', + 'offsetgroup': 'Qwen 1.5 Chat (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00254393]), + 'x': array([14928.]), 'xaxis': 'x', - 'y': array(['gemini-pro'], dtype=object), + 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'zephyr-7b-beta', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'OpenHermes-2.5-Mistral (7B)', 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}}, - 'name': 'zephyr-7b-beta', - 'offsetgroup': 'zephyr-7b-beta', + 'name': 'OpenHermes-2.5-Mistral (7B)', + 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00106251]), + 'x': array([14928.]), 'xaxis': 'x', - 'y': array(['zephyr-7b-beta'], dtype=object), + 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'Mistral-7B-Instruct-v0.2', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'LLaMA-2 Chat (7B)', 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}}, - 'name': 'Mistral-7B-Instruct-v0.2', - 'offsetgroup': 'Mistral-7B-Instruct-v0.2', + 'name': 'LLaMA-2 Chat (7B)', + 'offsetgroup': 'LLaMA-2 Chat (7B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00049303]), + 'x': array([14928.]), 'xaxis': 'x', - 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object), + 'y': array(['LLaMA-2 Chat (7B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'Falcon Instruct (7B)', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': '01-ai Yi Chat (34B)', 'marker': {'color': '#636efa', 'pattern': {'shape': ''}}, - 'name': 'Falcon Instruct (7B)', - 'offsetgroup': 'Falcon Instruct (7B)', + 'name': '01-ai Yi Chat (34B)', + 'offsetgroup': '01-ai Yi Chat (34B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.00021729]), + 'x': array([14928.]), 'xaxis': 'x', - 'y': array(['Falcon Instruct (7B)'], dtype=object), + 'y': array(['01-ai Yi Chat (34B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', - 'legendgroup': 'RedPajama-INCITE Chat (7B)', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', + 'legendgroup': 'Chronos Hermes (13B)', 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}}, - 'name': 'RedPajama-INCITE Chat (7B)', - 'offsetgroup': 'RedPajama-INCITE Chat (7B)', + 'name': 'Chronos Hermes (13B)', + 'offsetgroup': 'Chronos Hermes (13B)', 'orientation': 'h', 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.]), + 'x': array([14928.]), 'xaxis': 'x', - 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object), + 'y': array(['Chronos Hermes (13B)'], dtype=object), 'yaxis': 'y'}, {'alignmentgroup': 'True', - 'hovertemplate': 'Model=%{y}
BLEU score=%{x}', + 'hovertemplate': 'Model=%{y}
length penalty=%{x}', 'legendgroup': 'Upstage SOLAR Instruct v1 (11B)', 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}}, 'name': 'Upstage SOLAR Instruct v1 (11B)', @@ -2556,56 +2572,61 @@ plot_object,header,plot_json,description,df,arguments 'showlegend': True, 'textposition': 'auto', 'type': 'bar', - 'x': array([0.]), + 'x': array([14928.]), 'xaxis': 'x', 'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object), 'yaxis': 'y'}], 'layout': {'barmode': 'relative', 'legend': {'title': {'text': 'Model'}, 'tracegroupgap': 0}, 'template': '...', - 'title': {'text': 'Summary metrics BLEU score'}, - 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'BLEU score'}}, + 'title': {'text': 'Summary metrics length penalty'}, + 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'length penalty'}}, 'yaxis': {'anchor': 'x', 'categoryarray': [Upstage SOLAR Instruct v1 (11B), - RedPajama-INCITE Chat (7B), Falcon - Instruct (7B), Mistral-7B-Instruct-v0.2, - zephyr-7b-beta, gemini-pro, - Mixtral-8x7B-Instruct-v0.1, Snorkel - Mistral PairRM DPO (7B), chat-bison-32k - (PaLM 2 32K), - TinyLlama/TinyLlama-1.1B-Chat-v1.0, Qwen - 1.5 Chat (7B), llama-2-70b-chat, chat- - bison (PaLM 2), gpt-4-turbo, WizardLM - v1.2 (13B), LLaMA-2 Chat (7B), gpt-4, - Mistral (7B) Instruct v0.2 (Together - AI), OpenHermes-2.5-Mistral (7B), Vicuna - v1.5 (7B), 01-ai Yi Chat (34B), - gpt-3.5-turbo, Chronos Hermes (13B)], + Chronos Hermes (13B), 01-ai Yi Chat + (34B), LLaMA-2 Chat (7B), + OpenHermes-2.5-Mistral (7B), Qwen 1.5 + Chat (7B), WizardLM v1.2 (13B), Snorkel + Mistral PairRM DPO (7B), RedPajama- + INCITE Chat (7B), Falcon Instruct (7B), + Vicuna v1.5 (7B), Mistral (7B) Instruct + v0.2 (Together AI), chat-bison-32k (PaLM + 2 32K), chat-bison (PaLM 2), gpt-4, + gpt-4-turbo, + TinyLlama/TinyLlama-1.1B-Chat-v1.0, + gemini-pro, llama-2-70b-chat, + gpt-3.5-turbo, + Mixtral-8x7B-Instruct-v0.1, + zephyr-7b-beta, + Mistral-7B-Instruct-v0.2], 'categoryorder': 'array', 
'domain': [0.0, 1.0], 'title': {'text': 'Model'}}} -})",Summary metrics BLEU score,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.011439012700594395],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.007892445077902592],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.007311566390840339],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.006952332387656228],""xaxis"":""x"",""y"":[""Vicuna v1.5 
(7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.006563161880264231],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.005478518060743351],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.004704572681138337],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.004255859538193306],""xaxis"":""x"",""y"":[""LLaMA-2 Chat 
(7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.003671383039102015],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0034873692407505464],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0033173472693443363],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU 
score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.00329426273003284],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.003185571110431172],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.002991155730532842],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.002970914340485325],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 
32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.002907897771152987],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0026839271544750283],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0025439281189154664],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU 
score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0010625100735849574],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0004930290548816363],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.00021729364201653395],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003eBLEU 
score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3
333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""p
attern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"
":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":
""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""BLEU score""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""gemini-pro"",""Mixtral-8x7B-Instruct-v0.1"",""Snorkel Mistral PairRM DPO (7B)"",""chat-bison-32k (PaLM 2 32K)"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Qwen 1.5 Chat (7B)"",""llama-2-70b-chat"",""chat-bison (PaLM 2)"",""gpt-4-turbo"",""WizardLM v1.2 (13B)"",""LLaMA-2 Chat (7B)"",""gpt-4"",""Mistral (7B) Instruct v0.2 (Together AI)"",""OpenHermes-2.5-Mistral (7B)"",""Vicuna v1.5 (7B)"",""01-ai Yi Chat (34B)"",""gpt-3.5-turbo"",""Chronos Hermes (13B)""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BLEU score""},""barmode"":""relative""}}","BLEU (BiLingual Evaluation Understudy) measures similarity between unigrams, bigrams and trigrams in the summarized and original text. Unlike BERT score this metric doesn't handle synonyms. 
Value is averaged for each model.",",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score -1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395 -18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592 -0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339 -13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228 -7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231 -4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351 -19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337 -3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306 -14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015 -20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464 -15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363 -21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284 -8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172 -11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842 -16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325 
-10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987 -6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283 -17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664 -22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574 -5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363 -2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395 -9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0 -12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0 -","{""x"": ""bleu_score"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""bleu_score"": ""BLEU score"", ""model"": ""Model""}, ""title"": ""Summary metrics BLEU score""}" +})",Summary metrics length penalty,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[113258.0],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength 
penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[103714.0],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[103320.0],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[89814.0],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[88008.0],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength 
penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[87700.0],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[87700.0],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[85120.0],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[85120.0],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 
2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[83400.0],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[83400.0],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[29298.0],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[16948.0],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength 
penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength 
penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength 
penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""Model=%{y}\u003cbr\u003elength penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""
#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""tic
ks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#
00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":
{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""length penalty""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""Model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Chronos Hermes (13B)"",""01-ai Yi Chat (34B)"",""LLaMA-2 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Qwen 1.5 Chat (7B)"",""WizardLM v1.2 (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)"",""gpt-4"",""gpt-4-turbo"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""gemini-pro"",""llama-2-70b-chat"",""gpt-3.5-turbo"",""Mixtral-8x7B-Instruct-v0.1"",""zephyr-7b-beta"",""Mistral-7B-Instruct-v0.2""]},""legend"":{""title"":{""text"":""Model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics length penalty""},""barmode"":""relative""}}","It is assumed that good quality summary contains between 2 and 5 sentences (inclusive range).
+ The penalty is a difference between summary sentence count and this range. + + It is summed for each model.",",model,BERT_score_precision,BERT_score_recall,BERT_score_F1,BLEU_score,original_text_length_part,sentence_count,length_penalty +5,Mistral-7B-Instruct-v0.2,0.04389399,0.045185987,0.04378006,0.000566625796313851,0.04250630683894714,4.120342654588421,113258.0 +22,zephyr-7b-beta,0.085546724,0.08755772,0.085219756,0.0012612839176470308,0.08796697338212889,4.159788702026735,103714.0 +6,Mixtral-8x7B-Instruct-v0.1,0.19137934,0.2029136,0.19449018,0.0031843990217988536,0.2665288353398184,4.161038961038961,103320.0 +18,gpt-3.5-turbo,0.49478123,0.50445867,0.49331823,0.00919205486407126,0.5905700146991734,4.229639819909955,89814.0 +21,llama-2-70b-chat,0.20810011,0.22406381,0.21268094,0.004560500754935232,0.29684572894554634,4.2436893203883495,88008.0 +17,gemini-pro,0.23109974,0.23956373,0.23199782,0.0032373504004405487,0.295286999418032,4.244871794871795,87700.0 +11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122332305,0.12540509,0.12200464,0.003286423403673119,0.13915355617375091,4.244871794871795,87700.0 +20,gpt-4-turbo,0.42933634,0.4414623,0.4294052,0.0042830628392272,0.5393220459796505,4.266137566137566,85120.0 +19,gpt-4,0.4864653,0.49512562,0.4839312,0.005711113295666468,0.4763731952669352,4.266137566137566,85120.0 +15,chat-bison (PaLM 2),0.23123139,0.24001649,0.23214735,0.0037652345768886663,0.2927236655934559,4.281081081081081,83400.0 +16,chat-bison-32k (PaLM 2 32K),0.23051436,0.23993237,0.2317056,0.003694633514634998,0.2608806894318779,4.281081081081081,83400.0 +4,Mistral (7B) Instruct v0.2 (Together AI),0.36488953,0.3797993,0.36758336,0.005650224193975447,0.5233998570385472,3.712222222222222,29298.0 +13,Vicuna v1.5 (7B),0.28434175,0.29119453,0.2839047,0.007105541953090669,0.2781035051738079,3.6173027989821884,16948.0 +2,Falcon Instruct (7B),0.30270517,0.28607234,0.29104736,0.0030232447024239606,0.0490635544441649,3.5818443804034583,14928.0 +9,RedPajama-INCITE Chat 
(7B),0.26832756,0.27305293,0.26768887,0.0,0.0560284823193376,3.5818443804034583,14928.0 +10,Snorkel Mistral PairRM DPO (7B),0.3167385,0.34785262,0.32718164,0.0029236226777824676,3.7740234383755356,3.5818443804034583,14928.0 +14,WizardLM v1.2 (13B),0.3420949,0.34746957,0.33996373,0.00373442128604677,0.28716720161049375,3.5818443804034583,14928.0 +8,Qwen 1.5 Chat (7B),0.34898603,0.35945317,0.34867778,0.0033327500620805805,0.29904529709475364,3.5818443804034583,14928.0 +7,OpenHermes-2.5-Mistral (7B),0.3621834,0.3685358,0.36003792,0.0068684572027745494,0.312054520357568,3.5818443804034583,14928.0 +3,LLaMA-2 Chat (7B),0.32074162,0.33171847,0.32136682,0.004415024709996126,0.4084233313416049,3.5818443804034583,14928.0 +0,01-ai Yi Chat (34B),0.33981326,0.35219854,0.34183535,0.007428840277380581,0.43251538287409536,3.5818443804034583,14928.0 +1,Chronos Hermes (13B),0.31285536,0.32630467,0.3150877,0.011542047908319874,0.4742810243835248,3.5818443804034583,14928.0 +12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0 +","{""x"": ""length_penalty"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""labels"": {""length_penalty"": ""length penalty"", ""model"": ""Model""}, ""title"": ""Summary metrics length penalty""}"