diff --git "a/data/summary_metrics_plots.csv" "b/data/summary_metrics_plots.csv"
new file mode 100644--- /dev/null
+++ "b/data/summary_metrics_plots.csv"
@@ -0,0 +1,2611 @@
+plot_object,header,plot_json,description,df,arguments
+"Figure({
+ 'data': [{'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'gpt-3.5-turbo',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'gpt-3.5-turbo',
+ 'offsetgroup': 'gpt-3.5-turbo',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.4943981], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['gpt-3.5-turbo'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'gpt-4',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'gpt-4',
+ 'offsetgroup': 'gpt-4',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.48605907], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['gpt-4'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'gpt-4-turbo',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'gpt-4-turbo',
+ 'offsetgroup': 'gpt-4-turbo',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.42728576], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['gpt-4-turbo'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
+ 'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.3647361], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
+ 'name': 'OpenHermes-2.5-Mistral (7B)',
+ 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.3618188], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'Qwen 1.5 Chat (7B)',
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
+ 'name': 'Qwen 1.5 Chat (7B)',
+ 'offsetgroup': 'Qwen 1.5 Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.34855434], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'WizardLM v1.2 (13B)',
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
+ 'name': 'WizardLM v1.2 (13B)',
+ 'offsetgroup': 'WizardLM v1.2 (13B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.34085444], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['WizardLM v1.2 (13B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': '01-ai Yi Chat (34B)',
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
+ 'name': '01-ai Yi Chat (34B)',
+ 'offsetgroup': '01-ai Yi Chat (34B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.33974892], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['01-ai Yi Chat (34B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'LLaMA-2 Chat (7B)',
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
+ 'name': 'LLaMA-2 Chat (7B)',
+ 'offsetgroup': 'LLaMA-2 Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.3203912], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
+ 'name': 'Snorkel Mistral PairRM DPO (7B)',
+ 'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.31672964], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'Chronos Hermes (13B)',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'Chronos Hermes (13B)',
+ 'offsetgroup': 'Chronos Hermes (13B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.3124825], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Chronos Hermes (13B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'Falcon Instruct (7B)',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'Falcon Instruct (7B)',
+ 'offsetgroup': 'Falcon Instruct (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.2895086], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Falcon Instruct (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'Vicuna v1.5 (7B)',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'Vicuna v1.5 (7B)',
+ 'offsetgroup': 'Vicuna v1.5 (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.284109], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Vicuna v1.5 (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'RedPajama-INCITE Chat (7B)',
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
+ 'name': 'RedPajama-INCITE Chat (7B)',
+ 'offsetgroup': 'RedPajama-INCITE Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.261367], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'chat-bison (PaLM 2)',
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
+ 'name': 'chat-bison (PaLM 2)',
+ 'offsetgroup': 'chat-bison (PaLM 2)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.23117188], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['chat-bison (PaLM 2)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'gemini-pro',
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
+ 'name': 'gemini-pro',
+ 'offsetgroup': 'gemini-pro',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.23105659], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['gemini-pro'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.23046139], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'llama-2-70b-chat',
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
+ 'name': 'llama-2-70b-chat',
+ 'offsetgroup': 'llama-2-70b-chat',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.20800962], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['llama-2-70b-chat'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.19128644], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.12218507], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'zephyr-7b-beta',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'zephyr-7b-beta',
+ 'offsetgroup': 'zephyr-7b-beta',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.08539014], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['zephyr-7b-beta'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'Mistral-7B-Instruct-v0.2',
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.0438201], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_P=%{x}',
+ 'legendgroup': 'Upstage SOLAR Instruct v1 (11B)',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'Upstage SOLAR Instruct v1 (11B)',
+ 'offsetgroup': 'Upstage SOLAR Instruct v1 (11B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object),
+ 'yaxis': 'y'}],
+ 'layout': {'barmode': 'relative',
+ 'legend': {'title': {'text': 'model'}, 'tracegroupgap': 0},
+ 'template': '...',
+ 'title': {'text': 'Summary metrics BERT score P'},
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'bert_score_P'}},
+ 'yaxis': {'anchor': 'x',
+ 'categoryarray': [Upstage SOLAR Instruct v1 (11B),
+ Mistral-7B-Instruct-v0.2,
+ zephyr-7b-beta,
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
+ Mixtral-8x7B-Instruct-v0.1,
+ llama-2-70b-chat, chat-bison-32k (PaLM 2
+ 32K), gemini-pro, chat-bison (PaLM 2),
+ RedPajama-INCITE Chat (7B), Vicuna v1.5
+ (7B), Falcon Instruct (7B), Chronos
+ Hermes (13B), Snorkel Mistral PairRM DPO
+ (7B), LLaMA-2 Chat (7B), 01-ai Yi Chat
+ (34B), WizardLM v1.2 (13B), Qwen 1.5
+ Chat (7B), OpenHermes-2.5-Mistral (7B),
+ Mistral (7B) Instruct v0.2 (Together
+ AI), gpt-4-turbo, gpt-4, gpt-3.5-turbo],
+ 'categoryorder': 'array',
+ 'domain': [0.0, 1.0],
+ 'title': {'text': 'model'}}}
+})",Summary metrics BERT score P,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4943981],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.48605907],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.42728576],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3647361],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3618188],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34855434],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34085444],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.33974892],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3203912],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.31672964],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3124825],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2895086],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.284109],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.261367],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23117188],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23105659],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23046139],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.20800962],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.19128644],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.122185074],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.085390136],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.043820098],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_P=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""bert_score_P""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat"",""chat-bison-32k (PaLM 2 32K)"",""gemini-pro"",""chat-bison (PaLM 2)"",""RedPajama-INCITE Chat (7B)"",""Vicuna v1.5 (7B)"",""Falcon Instruct (7B)"",""Chronos Hermes (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""LLaMA-2 Chat (7B)"",""01-ai Yi Chat (34B)"",""WizardLM v1.2 (13B)"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-4"",""gpt-3.5-turbo""]},""legend"":{""title"":{""text"":""model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BERT score P""},""barmode"":""relative""}}",,",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score
+18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592
+19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337
+20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464
+4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351
+7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231
+8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172
+14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015
+0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339
+3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306
+10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987
+1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395
+2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395
+13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228
+9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0
+15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363
+17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664
+16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325
+21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284
+6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283
+11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842
+22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574
+5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363
+12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0
+","{""x"": ""bert_score_P"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""title"": ""Summary metrics BERT score P""}"
+"Figure({
+ 'data': [{'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'gpt-3.5-turbo',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'gpt-3.5-turbo',
+ 'offsetgroup': 'gpt-3.5-turbo',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.48408476], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['gpt-3.5-turbo'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'gpt-4',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'gpt-4',
+ 'offsetgroup': 'gpt-4',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.472583], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['gpt-4'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'gpt-4-turbo',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'gpt-4-turbo',
+ 'offsetgroup': 'gpt-4-turbo',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.4162435], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['gpt-4-turbo'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
+ 'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.3664233], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
+ 'name': 'OpenHermes-2.5-Mistral (7B)',
+ 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.35180506], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'Qwen 1.5 Chat (7B)',
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
+ 'name': 'Qwen 1.5 Chat (7B)',
+ 'offsetgroup': 'Qwen 1.5 Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.34154576], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': '01-ai Yi Chat (34B)',
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
+ 'name': '01-ai Yi Chat (34B)',
+ 'offsetgroup': '01-ai Yi Chat (34B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.3404481], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['01-ai Yi Chat (34B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
+ 'name': 'Snorkel Mistral PairRM DPO (7B)',
+ 'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.33782956], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'WizardLM v1.2 (13B)',
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
+ 'name': 'WizardLM v1.2 (13B)',
+ 'offsetgroup': 'WizardLM v1.2 (13B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.32933056], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['WizardLM v1.2 (13B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'LLaMA-2 Chat (7B)',
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
+ 'name': 'LLaMA-2 Chat (7B)',
+ 'offsetgroup': 'LLaMA-2 Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.3153909], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'Chronos Hermes (13B)',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'Chronos Hermes (13B)',
+ 'offsetgroup': 'Chronos Hermes (13B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.31071666], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Chronos Hermes (13B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'Vicuna v1.5 (7B)',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'Vicuna v1.5 (7B)',
+ 'offsetgroup': 'Vicuna v1.5 (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.27878883], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Vicuna v1.5 (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'Falcon Instruct (7B)',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'Falcon Instruct (7B)',
+ 'offsetgroup': 'Falcon Instruct (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.23968808], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Falcon Instruct (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'RedPajama-INCITE Chat (7B)',
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
+ 'name': 'RedPajama-INCITE Chat (7B)',
+ 'offsetgroup': 'RedPajama-INCITE Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.23758642], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'gemini-pro',
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
+ 'name': 'gemini-pro',
+ 'offsetgroup': 'gemini-pro',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.23057175], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['gemini-pro'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'chat-bison (PaLM 2)',
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
+ 'name': 'chat-bison (PaLM 2)',
+ 'offsetgroup': 'chat-bison (PaLM 2)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.23029378], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['chat-bison (PaLM 2)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.22983725], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'llama-2-70b-chat',
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
+ 'name': 'llama-2-70b-chat',
+ 'offsetgroup': 'llama-2-70b-chat',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.21472095], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['llama-2-70b-chat'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.19555509], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.11885959], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'zephyr-7b-beta',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'zephyr-7b-beta',
+ 'offsetgroup': 'zephyr-7b-beta',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.08266569], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['zephyr-7b-beta'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'Mistral-7B-Instruct-v0.2',
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.04256168], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_R=%{x}',
+ 'legendgroup': 'Upstage SOLAR Instruct v1 (11B)',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'Upstage SOLAR Instruct v1 (11B)',
+ 'offsetgroup': 'Upstage SOLAR Instruct v1 (11B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object),
+ 'yaxis': 'y'}],
+ 'layout': {'barmode': 'relative',
+ 'legend': {'title': {'text': 'model'}, 'tracegroupgap': 0},
+ 'template': '...',
+ 'title': {'text': 'Summary metrics BERT score R'},
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'bert_score_R'}},
+ 'yaxis': {'anchor': 'x',
+ 'categoryarray': [Upstage SOLAR Instruct v1 (11B),
+ Mistral-7B-Instruct-v0.2,
+ zephyr-7b-beta,
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
+ Mixtral-8x7B-Instruct-v0.1,
+ llama-2-70b-chat, chat-bison-32k (PaLM 2
+ 32K), chat-bison (PaLM 2), gemini-pro,
+ RedPajama-INCITE Chat (7B), Falcon
+ Instruct (7B), Vicuna v1.5 (7B), Chronos
+ Hermes (13B), LLaMA-2 Chat (7B),
+ WizardLM v1.2 (13B), Snorkel Mistral
+ PairRM DPO (7B), 01-ai Yi Chat (34B),
+ Qwen 1.5 Chat (7B),
+ OpenHermes-2.5-Mistral (7B), Mistral
+ (7B) Instruct v0.2 (Together AI),
+ gpt-4-turbo, gpt-4, gpt-3.5-turbo],
+ 'categoryorder': 'array',
+ 'domain': [0.0, 1.0],
+ 'title': {'text': 'model'}}}
+})",Summary metrics BERT score R,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.48408476],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.472583],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4162435],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3664233],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.35180506],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.34154576],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3404481],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.33782956],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.32933056],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3153909],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.31071666],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.27878883],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23968808],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23758642],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23057175],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23029378],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.22983725],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.21472095],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.19555509],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.11885959],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.08266569],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.042561684],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_R=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""bert_score_R""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)"",""gemini-pro"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Chronos Hermes (13B)"",""LLaMA-2 Chat (7B)"",""WizardLM v1.2 (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""01-ai Yi Chat (34B)"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-4"",""gpt-3.5-turbo""]},""legend"":{""title"":{""text"":""model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BERT score R""},""barmode"":""relative""}}",,",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score
+18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592
+19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337
+20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464
+4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351
+7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231
+8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172
+0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339
+10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987
+14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015
+3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306
+1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395
+13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228
+2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395
+9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0
+17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664
+15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363
+16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325
+21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284
+6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283
+11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842
+22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574
+5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363
+12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0
+","{""x"": ""bert_score_R"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""title"": ""Summary metrics BERT score R""}"
+"Figure({
+ 'data': [{'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'gpt-3.5-turbo',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'gpt-3.5-turbo',
+ 'offsetgroup': 'gpt-3.5-turbo',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.4888874], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['gpt-3.5-turbo'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'gpt-4',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'gpt-4',
+ 'offsetgroup': 'gpt-4',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.47901583], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['gpt-4'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'gpt-4-turbo',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'gpt-4-turbo',
+ 'offsetgroup': 'gpt-4-turbo',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.42098433], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['gpt-4-turbo'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
+ 'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.36540908], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
+ 'name': 'OpenHermes-2.5-Mistral (7B)',
+ 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.3565194], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'Qwen 1.5 Chat (7B)',
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
+ 'name': 'Qwen 1.5 Chat (7B)',
+ 'offsetgroup': 'Qwen 1.5 Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.344803], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': '01-ai Yi Chat (34B)',
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
+ 'name': '01-ai Yi Chat (34B)',
+ 'offsetgroup': '01-ai Yi Chat (34B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.3399749], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['01-ai Yi Chat (34B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'WizardLM v1.2 (13B)',
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
+ 'name': 'WizardLM v1.2 (13B)',
+ 'offsetgroup': 'WizardLM v1.2 (13B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.33466902], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['WizardLM v1.2 (13B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
+ 'name': 'Snorkel Mistral PairRM DPO (7B)',
+ 'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.3265383], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'LLaMA-2 Chat (7B)',
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
+ 'name': 'LLaMA-2 Chat (7B)',
+ 'offsetgroup': 'LLaMA-2 Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.31770444], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'Chronos Hermes (13B)',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'Chronos Hermes (13B)',
+ 'offsetgroup': 'Chronos Hermes (13B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.311415], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Chronos Hermes (13B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'Vicuna v1.5 (7B)',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'Vicuna v1.5 (7B)',
+ 'offsetgroup': 'Vicuna v1.5 (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.28129113], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Vicuna v1.5 (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'Falcon Instruct (7B)',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'Falcon Instruct (7B)',
+ 'offsetgroup': 'Falcon Instruct (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.2615204], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Falcon Instruct (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'RedPajama-INCITE Chat (7B)',
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
+ 'name': 'RedPajama-INCITE Chat (7B)',
+ 'offsetgroup': 'RedPajama-INCITE Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.2487217], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'gemini-pro',
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
+ 'name': 'gemini-pro',
+ 'offsetgroup': 'gemini-pro',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.23072062], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['gemini-pro'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'chat-bison (PaLM 2)',
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
+ 'name': 'chat-bison (PaLM 2)',
+ 'offsetgroup': 'chat-bison (PaLM 2)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.23060663], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['chat-bison (PaLM 2)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.23002876], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'llama-2-70b-chat',
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
+ 'name': 'llama-2-70b-chat',
+ 'offsetgroup': 'llama-2-70b-chat',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.21117964], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['llama-2-70b-chat'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.19330867], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.12042627], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'zephyr-7b-beta',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'zephyr-7b-beta',
+ 'offsetgroup': 'zephyr-7b-beta',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.08394519], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['zephyr-7b-beta'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'Mistral-7B-Instruct-v0.2',
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.04313921], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bert_score_F1=%{x}',
+ 'legendgroup': 'Upstage SOLAR Instruct v1 (11B)',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'Upstage SOLAR Instruct v1 (11B)',
+ 'offsetgroup': 'Upstage SOLAR Instruct v1 (11B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.], dtype=float32),
+ 'xaxis': 'x',
+ 'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object),
+ 'yaxis': 'y'}],
+ 'layout': {'barmode': 'relative',
+ 'legend': {'title': {'text': 'model'}, 'tracegroupgap': 0},
+ 'template': '...',
+ 'title': {'text': 'Summary metrics BERT score F1'},
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'bert_score_F1'}},
+ 'yaxis': {'anchor': 'x',
+ 'categoryarray': [Upstage SOLAR Instruct v1 (11B),
+ Mistral-7B-Instruct-v0.2,
+ zephyr-7b-beta,
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
+ Mixtral-8x7B-Instruct-v0.1,
+ llama-2-70b-chat, chat-bison-32k (PaLM 2
+ 32K), chat-bison (PaLM 2), gemini-pro,
+ RedPajama-INCITE Chat (7B), Falcon
+ Instruct (7B), Vicuna v1.5 (7B), Chronos
+ Hermes (13B), LLaMA-2 Chat (7B), Snorkel
+ Mistral PairRM DPO (7B), WizardLM v1.2
+ (13B), 01-ai Yi Chat (34B), Qwen 1.5
+ Chat (7B), OpenHermes-2.5-Mistral (7B),
+ Mistral (7B) Instruct v0.2 (Together
+ AI), gpt-4-turbo, gpt-4, gpt-3.5-turbo],
+ 'categoryorder': 'array',
+ 'domain': [0.0, 1.0],
+ 'title': {'text': 'model'}}}
+})",Summary metrics BERT score F1,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4888874],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.47901583],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.42098433],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.36540908],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3565194],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.344803],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3399749],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.33466902],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.3265383],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.31770444],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.311415],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.28129113],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2615204],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2487217],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23072062],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23060663],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.23002876],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.21117964],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.19330867],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.12042627],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.08394519],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.04313921],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebert_score_F1=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""bert_score_F1""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Mixtral-8x7B-Instruct-v0.1"",""llama-2-70b-chat"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)"",""gemini-pro"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Chronos Hermes (13B)"",""LLaMA-2 Chat (7B)"",""Snorkel Mistral PairRM DPO (7B)"",""WizardLM v1.2 (13B)"",""01-ai Yi Chat (34B)"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-4"",""gpt-3.5-turbo""]},""legend"":{""title"":{""text"":""model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BERT score F1""},""barmode"":""relative""}}",How similar are the BERT model embeddings of the summary to the BERT model embeddings of the original text. Value is averaged for each model.,",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score
+18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592
+19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337
+20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464
+4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351
+7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231
+8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172
+0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339
+14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015
+10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987
+3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306
+1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395
+13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228
+2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395
+9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0
+17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664
+15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363
+16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325
+21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284
+6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283
+11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842
+22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574
+5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363
+12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0
+","{""x"": ""bert_score_F1"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""title"": ""Summary metrics BERT score F1""}"
+"Figure({
+ 'data': [{'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'Snorkel Mistral PairRM DPO (7B)',
+ 'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([3.77402344]),
+ 'xaxis': 'x',
+ 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'gpt-3.5-turbo',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'gpt-3.5-turbo',
+ 'offsetgroup': 'gpt-3.5-turbo',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.59057001]),
+ 'xaxis': 'x',
+ 'y': array(['gpt-3.5-turbo'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'gpt-4-turbo',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'gpt-4-turbo',
+ 'offsetgroup': 'gpt-4-turbo',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.53932205]),
+ 'xaxis': 'x',
+ 'y': array(['gpt-4-turbo'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
+ 'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.52339986]),
+ 'xaxis': 'x',
+ 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'gpt-4',
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
+ 'name': 'gpt-4',
+ 'offsetgroup': 'gpt-4',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.4763732]),
+ 'xaxis': 'x',
+ 'y': array(['gpt-4'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'Chronos Hermes (13B)',
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
+ 'name': 'Chronos Hermes (13B)',
+ 'offsetgroup': 'Chronos Hermes (13B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.47428102]),
+ 'xaxis': 'x',
+ 'y': array(['Chronos Hermes (13B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': '01-ai Yi Chat (34B)',
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
+ 'name': '01-ai Yi Chat (34B)',
+ 'offsetgroup': '01-ai Yi Chat (34B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.43251538]),
+ 'xaxis': 'x',
+ 'y': array(['01-ai Yi Chat (34B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'LLaMA-2 Chat (7B)',
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
+ 'name': 'LLaMA-2 Chat (7B)',
+ 'offsetgroup': 'LLaMA-2 Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.40842333]),
+ 'xaxis': 'x',
+ 'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
+ 'name': 'OpenHermes-2.5-Mistral (7B)',
+ 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.31205452]),
+ 'xaxis': 'x',
+ 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'Qwen 1.5 Chat (7B)',
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
+ 'name': 'Qwen 1.5 Chat (7B)',
+ 'offsetgroup': 'Qwen 1.5 Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.2990453]),
+ 'xaxis': 'x',
+ 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'llama-2-70b-chat',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'llama-2-70b-chat',
+ 'offsetgroup': 'llama-2-70b-chat',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.29684573]),
+ 'xaxis': 'x',
+ 'y': array(['llama-2-70b-chat'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'gemini-pro',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'gemini-pro',
+ 'offsetgroup': 'gemini-pro',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.295287]),
+ 'xaxis': 'x',
+ 'y': array(['gemini-pro'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'chat-bison (PaLM 2)',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'chat-bison (PaLM 2)',
+ 'offsetgroup': 'chat-bison (PaLM 2)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.29272367]),
+ 'xaxis': 'x',
+ 'y': array(['chat-bison (PaLM 2)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'WizardLM v1.2 (13B)',
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
+ 'name': 'WizardLM v1.2 (13B)',
+ 'offsetgroup': 'WizardLM v1.2 (13B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.2871672]),
+ 'xaxis': 'x',
+ 'y': array(['WizardLM v1.2 (13B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'Vicuna v1.5 (7B)',
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
+ 'name': 'Vicuna v1.5 (7B)',
+ 'offsetgroup': 'Vicuna v1.5 (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.27810351]),
+ 'xaxis': 'x',
+ 'y': array(['Vicuna v1.5 (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.26652884]),
+ 'xaxis': 'x',
+ 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.26088069]),
+ 'xaxis': 'x',
+ 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.13915356]),
+ 'xaxis': 'x',
+ 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'zephyr-7b-beta',
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
+ 'name': 'zephyr-7b-beta',
+ 'offsetgroup': 'zephyr-7b-beta',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.08796697]),
+ 'xaxis': 'x',
+ 'y': array(['zephyr-7b-beta'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'RedPajama-INCITE Chat (7B)',
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
+ 'name': 'RedPajama-INCITE Chat (7B)',
+ 'offsetgroup': 'RedPajama-INCITE Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.05602848]),
+ 'xaxis': 'x',
+ 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'Falcon Instruct (7B)',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'Falcon Instruct (7B)',
+ 'offsetgroup': 'Falcon Instruct (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.04906355]),
+ 'xaxis': 'x',
+ 'y': array(['Falcon Instruct (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'Mistral-7B-Instruct-v0.2',
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.04250631]),
+ 'xaxis': 'x',
+ 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
original_text_length_part=%{x}',
+ 'legendgroup': 'Upstage SOLAR Instruct v1 (11B)',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'Upstage SOLAR Instruct v1 (11B)',
+ 'offsetgroup': 'Upstage SOLAR Instruct v1 (11B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00176623]),
+ 'xaxis': 'x',
+ 'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object),
+ 'yaxis': 'y'}],
+ 'layout': {'barmode': 'relative',
+ 'legend': {'title': {'text': 'model'}, 'tracegroupgap': 0},
+ 'template': '...',
+ 'title': {'text': 'Summary metrics original text length part'},
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'original_text_length_part'}},
+ 'yaxis': {'anchor': 'x',
+ 'categoryarray': [Upstage SOLAR Instruct v1 (11B),
+ Mistral-7B-Instruct-v0.2, Falcon
+ Instruct (7B), RedPajama-INCITE Chat
+ (7B), zephyr-7b-beta,
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
+ chat-bison-32k (PaLM 2 32K),
+ Mixtral-8x7B-Instruct-v0.1, Vicuna v1.5
+ (7B), WizardLM v1.2 (13B), chat-bison
+ (PaLM 2), gemini-pro, llama-2-70b-chat,
+ Qwen 1.5 Chat (7B),
+ OpenHermes-2.5-Mistral (7B), LLaMA-2
+ Chat (7B), 01-ai Yi Chat (34B), Chronos
+ Hermes (13B), gpt-4, Mistral (7B)
+ Instruct v0.2 (Together AI),
+ gpt-4-turbo, gpt-3.5-turbo, Snorkel
+ Mistral PairRM DPO (7B)],
+ 'categoryorder': 'array',
+ 'domain': [0.0, 1.0],
+ 'title': {'text': 'model'}}}
+})",Summary metrics original text length part,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.7740234383755356],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.5905700146991734],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.5393220459796505],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.5233998570385472],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4763731952669352],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4742810243835248],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.43251538287409536],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.4084233313416049],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.312054520357568],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.29904529709475364],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.29684572894554634],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.295286999418032],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2927236655934559],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.28716720161049375],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2781035051738079],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2665288353398184],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.2608806894318779],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.13915355617375091],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.08796697338212889],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0560284823193376],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0490635544441649],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.04250630683894714],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003eoriginal_text_length_part=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0017662349842492329],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""original_text_length_part""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Mistral-7B-Instruct-v0.2"",""Falcon Instruct (7B)"",""RedPajama-INCITE Chat (7B)"",""zephyr-7b-beta"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""chat-bison-32k (PaLM 2 32K)"",""Mixtral-8x7B-Instruct-v0.1"",""Vicuna v1.5 (7B)"",""WizardLM v1.2 (13B)"",""chat-bison (PaLM 2)"",""gemini-pro"",""llama-2-70b-chat"",""Qwen 1.5 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""LLaMA-2 Chat (7B)"",""01-ai Yi Chat (34B)"",""Chronos Hermes (13B)"",""gpt-4"",""Mistral (7B) Instruct v0.2 (Together AI)"",""gpt-4-turbo"",""gpt-3.5-turbo"",""Snorkel Mistral PairRM DPO (7B)""]},""legend"":{""title"":{""text"":""model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics original text length part""},""barmode"":""relative""}}","How long is the summarization compared to the original text, calculated as: `len(summarized_text) + 1 / len(original_text) + 1`. Value is averaged for each model.",",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score
+10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987
+18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592
+20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464
+4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351
+19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337
+1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395
+0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339
+3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306
+7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231
+8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172
+21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284
+17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664
+15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363
+14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015
+13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228
+6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283
+16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325
+11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842
+22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574
+9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0
+2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395
+5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363
+12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0
+","{""x"": ""original_text_length_part"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""title"": ""Summary metrics original text length part""}"
+"Figure({
+ 'data': [{'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'chat-bison (PaLM 2)',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'chat-bison (PaLM 2)',
+ 'offsetgroup': 'chat-bison (PaLM 2)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([4.28108108]),
+ 'xaxis': 'x',
+ 'y': array(['chat-bison (PaLM 2)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([4.28108108]),
+ 'xaxis': 'x',
+ 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'gpt-4-turbo',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'gpt-4-turbo',
+ 'offsetgroup': 'gpt-4-turbo',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([4.26613757]),
+ 'xaxis': 'x',
+ 'y': array(['gpt-4-turbo'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'gpt-4',
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
+ 'name': 'gpt-4',
+ 'offsetgroup': 'gpt-4',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([4.26613757]),
+ 'xaxis': 'x',
+ 'y': array(['gpt-4'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'gemini-pro',
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
+ 'name': 'gemini-pro',
+ 'offsetgroup': 'gemini-pro',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([4.24487179]),
+ 'xaxis': 'x',
+ 'y': array(['gemini-pro'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([4.24487179]),
+ 'xaxis': 'x',
+ 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'llama-2-70b-chat',
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
+ 'name': 'llama-2-70b-chat',
+ 'offsetgroup': 'llama-2-70b-chat',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([4.24368932]),
+ 'xaxis': 'x',
+ 'y': array(['llama-2-70b-chat'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'gpt-3.5-turbo',
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
+ 'name': 'gpt-3.5-turbo',
+ 'offsetgroup': 'gpt-3.5-turbo',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([4.22963982]),
+ 'xaxis': 'x',
+ 'y': array(['gpt-3.5-turbo'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([4.16103896]),
+ 'xaxis': 'x',
+ 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'zephyr-7b-beta',
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
+ 'name': 'zephyr-7b-beta',
+ 'offsetgroup': 'zephyr-7b-beta',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([4.1597887]),
+ 'xaxis': 'x',
+ 'y': array(['zephyr-7b-beta'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'Mistral-7B-Instruct-v0.2',
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([4.12034265]),
+ 'xaxis': 'x',
+ 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([3.71222222]),
+ 'xaxis': 'x',
+ 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'Vicuna v1.5 (7B)',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'Vicuna v1.5 (7B)',
+ 'offsetgroup': 'Vicuna v1.5 (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([3.6173028]),
+ 'xaxis': 'x',
+ 'y': array(['Vicuna v1.5 (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'Falcon Instruct (7B)',
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
+ 'name': 'Falcon Instruct (7B)',
+ 'offsetgroup': 'Falcon Instruct (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([3.58184438]),
+ 'xaxis': 'x',
+ 'y': array(['Falcon Instruct (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'RedPajama-INCITE Chat (7B)',
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
+ 'name': 'RedPajama-INCITE Chat (7B)',
+ 'offsetgroup': 'RedPajama-INCITE Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([3.58184438]),
+ 'xaxis': 'x',
+ 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
+ 'name': 'Snorkel Mistral PairRM DPO (7B)',
+ 'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([3.58184438]),
+ 'xaxis': 'x',
+ 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'WizardLM v1.2 (13B)',
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
+ 'name': 'WizardLM v1.2 (13B)',
+ 'offsetgroup': 'WizardLM v1.2 (13B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([3.58184438]),
+ 'xaxis': 'x',
+ 'y': array(['WizardLM v1.2 (13B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'Qwen 1.5 Chat (7B)',
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
+ 'name': 'Qwen 1.5 Chat (7B)',
+ 'offsetgroup': 'Qwen 1.5 Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([3.58184438]),
+ 'xaxis': 'x',
+ 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
+ 'name': 'OpenHermes-2.5-Mistral (7B)',
+ 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([3.58184438]),
+ 'xaxis': 'x',
+ 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'LLaMA-2 Chat (7B)',
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
+ 'name': 'LLaMA-2 Chat (7B)',
+ 'offsetgroup': 'LLaMA-2 Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([3.58184438]),
+ 'xaxis': 'x',
+ 'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': '01-ai Yi Chat (34B)',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': '01-ai Yi Chat (34B)',
+ 'offsetgroup': '01-ai Yi Chat (34B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([3.58184438]),
+ 'xaxis': 'x',
+ 'y': array(['01-ai Yi Chat (34B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'Chronos Hermes (13B)',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'Chronos Hermes (13B)',
+ 'offsetgroup': 'Chronos Hermes (13B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([3.58184438]),
+ 'xaxis': 'x',
+ 'y': array(['Chronos Hermes (13B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
sentence_count=%{x}',
+ 'legendgroup': 'Upstage SOLAR Instruct v1 (11B)',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'Upstage SOLAR Instruct v1 (11B)',
+ 'offsetgroup': 'Upstage SOLAR Instruct v1 (11B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([3.58184438]),
+ 'xaxis': 'x',
+ 'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object),
+ 'yaxis': 'y'}],
+ 'layout': {'barmode': 'relative',
+ 'legend': {'title': {'text': 'model'}, 'tracegroupgap': 0},
+ 'template': '...',
+ 'title': {'text': 'Summary metrics sentence count'},
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'sentence_count'}},
+ 'yaxis': {'anchor': 'x',
+ 'categoryarray': [Upstage SOLAR Instruct v1 (11B),
+ Chronos Hermes (13B), 01-ai Yi Chat
+ (34B), LLaMA-2 Chat (7B),
+ OpenHermes-2.5-Mistral (7B), Qwen 1.5
+ Chat (7B), WizardLM v1.2 (13B), Snorkel
+ Mistral PairRM DPO (7B), RedPajama-
+ INCITE Chat (7B), Falcon Instruct (7B),
+ Vicuna v1.5 (7B), Mistral (7B) Instruct
+ v0.2 (Together AI),
+ Mistral-7B-Instruct-v0.2,
+ zephyr-7b-beta,
+ Mixtral-8x7B-Instruct-v0.1,
+ gpt-3.5-turbo, llama-2-70b-chat,
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
+ gemini-pro, gpt-4, gpt-4-turbo, chat-
+ bison-32k (PaLM 2 32K), chat-bison (PaLM
+ 2)],
+ 'categoryorder': 'array',
+ 'domain': [0.0, 1.0],
+ 'title': {'text': 'model'}}}
+})",Summary metrics sentence count,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.281081081081081],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.281081081081081],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.266137566137566],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.266137566137566],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.244871794871795],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.244871794871795],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.2436893203883495],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.229639819909955],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.161038961038961],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.159788702026735],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[4.120342654588421],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.712222222222222],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.6173027989821884],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003esentence_count=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[3.5818443804034583],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""sentence_count""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Chronos Hermes (13B)"",""01-ai Yi Chat (34B)"",""LLaMA-2 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Qwen 1.5 Chat (7B)"",""WizardLM v1.2 (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""Mixtral-8x7B-Instruct-v0.1"",""gpt-3.5-turbo"",""llama-2-70b-chat"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""gemini-pro"",""gpt-4"",""gpt-4-turbo"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)""]},""legend"":{""title"":{""text"":""model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics sentence count""},""barmode"":""relative""}}",Average sentence count of the summary.,",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score
+15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363
+16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325
+20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464
+19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337
+17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664
+11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842
+21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284
+18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592
+6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283
+22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574
+5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363
+4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351
+13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228
+2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395
+9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0
+10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987
+14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015
+8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172
+7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231
+3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306
+0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339
+1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395
+12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0
+","{""x"": ""sentence_count"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""title"": ""Summary metrics sentence count""}"
+"Figure({
+ 'data': [{'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'Mistral-7B-Instruct-v0.2',
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([113258.]),
+ 'xaxis': 'x',
+ 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'zephyr-7b-beta',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'zephyr-7b-beta',
+ 'offsetgroup': 'zephyr-7b-beta',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([103714.]),
+ 'xaxis': 'x',
+ 'y': array(['zephyr-7b-beta'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([103320.]),
+ 'xaxis': 'x',
+ 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'gpt-3.5-turbo',
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
+ 'name': 'gpt-3.5-turbo',
+ 'offsetgroup': 'gpt-3.5-turbo',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([89814.]),
+ 'xaxis': 'x',
+ 'y': array(['gpt-3.5-turbo'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'llama-2-70b-chat',
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
+ 'name': 'llama-2-70b-chat',
+ 'offsetgroup': 'llama-2-70b-chat',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([88008.]),
+ 'xaxis': 'x',
+ 'y': array(['llama-2-70b-chat'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'gemini-pro',
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
+ 'name': 'gemini-pro',
+ 'offsetgroup': 'gemini-pro',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([87700.]),
+ 'xaxis': 'x',
+ 'y': array(['gemini-pro'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([87700.]),
+ 'xaxis': 'x',
+ 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'gpt-4-turbo',
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
+ 'name': 'gpt-4-turbo',
+ 'offsetgroup': 'gpt-4-turbo',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([85120.]),
+ 'xaxis': 'x',
+ 'y': array(['gpt-4-turbo'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'gpt-4',
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
+ 'name': 'gpt-4',
+ 'offsetgroup': 'gpt-4',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([85120.]),
+ 'xaxis': 'x',
+ 'y': array(['gpt-4'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'chat-bison (PaLM 2)',
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
+ 'name': 'chat-bison (PaLM 2)',
+ 'offsetgroup': 'chat-bison (PaLM 2)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([83400.]),
+ 'xaxis': 'x',
+ 'y': array(['chat-bison (PaLM 2)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([83400.]),
+ 'xaxis': 'x',
+ 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([29298.]),
+ 'xaxis': 'x',
+ 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'Vicuna v1.5 (7B)',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'Vicuna v1.5 (7B)',
+ 'offsetgroup': 'Vicuna v1.5 (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([16948.]),
+ 'xaxis': 'x',
+ 'y': array(['Vicuna v1.5 (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'Falcon Instruct (7B)',
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
+ 'name': 'Falcon Instruct (7B)',
+ 'offsetgroup': 'Falcon Instruct (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([14928.]),
+ 'xaxis': 'x',
+ 'y': array(['Falcon Instruct (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'RedPajama-INCITE Chat (7B)',
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
+ 'name': 'RedPajama-INCITE Chat (7B)',
+ 'offsetgroup': 'RedPajama-INCITE Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([14928.]),
+ 'xaxis': 'x',
+ 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
+ 'name': 'Snorkel Mistral PairRM DPO (7B)',
+ 'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([14928.]),
+ 'xaxis': 'x',
+ 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'WizardLM v1.2 (13B)',
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
+ 'name': 'WizardLM v1.2 (13B)',
+ 'offsetgroup': 'WizardLM v1.2 (13B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([14928.]),
+ 'xaxis': 'x',
+ 'y': array(['WizardLM v1.2 (13B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'Qwen 1.5 Chat (7B)',
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
+ 'name': 'Qwen 1.5 Chat (7B)',
+ 'offsetgroup': 'Qwen 1.5 Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([14928.]),
+ 'xaxis': 'x',
+ 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
+ 'name': 'OpenHermes-2.5-Mistral (7B)',
+ 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([14928.]),
+ 'xaxis': 'x',
+ 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'LLaMA-2 Chat (7B)',
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
+ 'name': 'LLaMA-2 Chat (7B)',
+ 'offsetgroup': 'LLaMA-2 Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([14928.]),
+ 'xaxis': 'x',
+ 'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': '01-ai Yi Chat (34B)',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': '01-ai Yi Chat (34B)',
+ 'offsetgroup': '01-ai Yi Chat (34B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([14928.]),
+ 'xaxis': 'x',
+ 'y': array(['01-ai Yi Chat (34B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'Chronos Hermes (13B)',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'Chronos Hermes (13B)',
+ 'offsetgroup': 'Chronos Hermes (13B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([14928.]),
+ 'xaxis': 'x',
+ 'y': array(['Chronos Hermes (13B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
length_penalty=%{x}',
+ 'legendgroup': 'Upstage SOLAR Instruct v1 (11B)',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'Upstage SOLAR Instruct v1 (11B)',
+ 'offsetgroup': 'Upstage SOLAR Instruct v1 (11B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([14928.]),
+ 'xaxis': 'x',
+ 'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object),
+ 'yaxis': 'y'}],
+ 'layout': {'barmode': 'relative',
+ 'legend': {'title': {'text': 'model'}, 'tracegroupgap': 0},
+ 'template': '...',
+ 'title': {'text': 'Summary metrics length penalty'},
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'length_penalty'}},
+ 'yaxis': {'anchor': 'x',
+ 'categoryarray': [Upstage SOLAR Instruct v1 (11B),
+ Chronos Hermes (13B), 01-ai Yi Chat
+ (34B), LLaMA-2 Chat (7B),
+ OpenHermes-2.5-Mistral (7B), Qwen 1.5
+ Chat (7B), WizardLM v1.2 (13B), Snorkel
+ Mistral PairRM DPO (7B), RedPajama-
+ INCITE Chat (7B), Falcon Instruct (7B),
+ Vicuna v1.5 (7B), Mistral (7B) Instruct
+ v0.2 (Together AI), chat-bison-32k (PaLM
+ 2 32K), chat-bison (PaLM 2), gpt-4,
+ gpt-4-turbo,
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0,
+ gemini-pro, llama-2-70b-chat,
+ gpt-3.5-turbo,
+ Mixtral-8x7B-Instruct-v0.1,
+ zephyr-7b-beta,
+ Mistral-7B-Instruct-v0.2],
+ 'categoryorder': 'array',
+ 'domain': [0.0, 1.0],
+ 'title': {'text': 'model'}}}
+})",Summary metrics length penalty,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[113258.0],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[103714.0],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[103320.0],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[89814.0],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[88008.0],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[87700.0],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[87700.0],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[85120.0],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[85120.0],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[83400.0],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[83400.0],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[29298.0],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[16948.0],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003elength_penalty=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[14928.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""length_penalty""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""Chronos Hermes (13B)"",""01-ai Yi Chat (34B)"",""LLaMA-2 Chat (7B)"",""OpenHermes-2.5-Mistral (7B)"",""Qwen 1.5 Chat (7B)"",""WizardLM v1.2 (13B)"",""Snorkel Mistral PairRM DPO (7B)"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Vicuna v1.5 (7B)"",""Mistral (7B) Instruct v0.2 (Together AI)"",""chat-bison-32k (PaLM 2 32K)"",""chat-bison (PaLM 2)"",""gpt-4"",""gpt-4-turbo"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""gemini-pro"",""llama-2-70b-chat"",""gpt-3.5-turbo"",""Mixtral-8x7B-Instruct-v0.1"",""zephyr-7b-beta"",""Mistral-7B-Instruct-v0.2""]},""legend"":{""title"":{""text"":""model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics length penalty""},""barmode"":""relative""}}",It is assumed that good quality summary contains between 2 and 5 sentences (inclusive range). The penalty is a difference between summary sentence count and this range. It is summed for each model.,",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score
+5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363
+22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574
+6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283
+18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592
+21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284
+17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664
+11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842
+20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464
+19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337
+15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363
+16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325
+4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351
+13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228
+2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395
+9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0
+10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987
+14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015
+8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172
+7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231
+3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306
+0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339
+1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395
+12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0
+","{""x"": ""length_penalty"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""title"": ""Summary metrics length penalty""}"
+"Figure({
+ 'data': [{'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'Chronos Hermes (13B)',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'Chronos Hermes (13B)',
+ 'offsetgroup': 'Chronos Hermes (13B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.01143901]),
+ 'xaxis': 'x',
+ 'y': array(['Chronos Hermes (13B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'gpt-3.5-turbo',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'gpt-3.5-turbo',
+ 'offsetgroup': 'gpt-3.5-turbo',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00789245]),
+ 'xaxis': 'x',
+ 'y': array(['gpt-3.5-turbo'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': '01-ai Yi Chat (34B)',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': '01-ai Yi Chat (34B)',
+ 'offsetgroup': '01-ai Yi Chat (34B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00731157]),
+ 'xaxis': 'x',
+ 'y': array(['01-ai Yi Chat (34B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'Vicuna v1.5 (7B)',
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
+ 'name': 'Vicuna v1.5 (7B)',
+ 'offsetgroup': 'Vicuna v1.5 (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00695233]),
+ 'xaxis': 'x',
+ 'y': array(['Vicuna v1.5 (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
+ 'name': 'OpenHermes-2.5-Mistral (7B)',
+ 'offsetgroup': 'OpenHermes-2.5-Mistral (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00656316]),
+ 'xaxis': 'x',
+ 'y': array(['OpenHermes-2.5-Mistral (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
+ 'name': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'offsetgroup': 'Mistral (7B) Instruct v0.2 (Together AI)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00547852]),
+ 'xaxis': 'x',
+ 'y': array(['Mistral (7B) Instruct v0.2 (Together AI)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'gpt-4',
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
+ 'name': 'gpt-4',
+ 'offsetgroup': 'gpt-4',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00470457]),
+ 'xaxis': 'x',
+ 'y': array(['gpt-4'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'LLaMA-2 Chat (7B)',
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
+ 'name': 'LLaMA-2 Chat (7B)',
+ 'offsetgroup': 'LLaMA-2 Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00425586]),
+ 'xaxis': 'x',
+ 'y': array(['LLaMA-2 Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'WizardLM v1.2 (13B)',
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
+ 'name': 'WizardLM v1.2 (13B)',
+ 'offsetgroup': 'WizardLM v1.2 (13B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00367138]),
+ 'xaxis': 'x',
+ 'y': array(['WizardLM v1.2 (13B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'gpt-4-turbo',
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
+ 'name': 'gpt-4-turbo',
+ 'offsetgroup': 'gpt-4-turbo',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00348737]),
+ 'xaxis': 'x',
+ 'y': array(['gpt-4-turbo'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'chat-bison (PaLM 2)',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'chat-bison (PaLM 2)',
+ 'offsetgroup': 'chat-bison (PaLM 2)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00331735]),
+ 'xaxis': 'x',
+ 'y': array(['chat-bison (PaLM 2)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'llama-2-70b-chat',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'llama-2-70b-chat',
+ 'offsetgroup': 'llama-2-70b-chat',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00329426]),
+ 'xaxis': 'x',
+ 'y': array(['llama-2-70b-chat'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'Qwen 1.5 Chat (7B)',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'Qwen 1.5 Chat (7B)',
+ 'offsetgroup': 'Qwen 1.5 Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00318557]),
+ 'xaxis': 'x',
+ 'y': array(['Qwen 1.5 Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'marker': {'color': '#ab63fa', 'pattern': {'shape': ''}},
+ 'name': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'offsetgroup': 'TinyLlama/TinyLlama-1.1B-Chat-v1.0',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00299116]),
+ 'xaxis': 'x',
+ 'y': array(['TinyLlama/TinyLlama-1.1B-Chat-v1.0'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'marker': {'color': '#FFA15A', 'pattern': {'shape': ''}},
+ 'name': 'chat-bison-32k (PaLM 2 32K)',
+ 'offsetgroup': 'chat-bison-32k (PaLM 2 32K)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00297091]),
+ 'xaxis': 'x',
+ 'y': array(['chat-bison-32k (PaLM 2 32K)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'marker': {'color': '#19d3f3', 'pattern': {'shape': ''}},
+ 'name': 'Snorkel Mistral PairRM DPO (7B)',
+ 'offsetgroup': 'Snorkel Mistral PairRM DPO (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.0029079]),
+ 'xaxis': 'x',
+ 'y': array(['Snorkel Mistral PairRM DPO (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'marker': {'color': '#FF6692', 'pattern': {'shape': ''}},
+ 'name': 'Mixtral-8x7B-Instruct-v0.1',
+ 'offsetgroup': 'Mixtral-8x7B-Instruct-v0.1',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00268393]),
+ 'xaxis': 'x',
+ 'y': array(['Mixtral-8x7B-Instruct-v0.1'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'gemini-pro',
+ 'marker': {'color': '#B6E880', 'pattern': {'shape': ''}},
+ 'name': 'gemini-pro',
+ 'offsetgroup': 'gemini-pro',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00254393]),
+ 'xaxis': 'x',
+ 'y': array(['gemini-pro'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'zephyr-7b-beta',
+ 'marker': {'color': '#FF97FF', 'pattern': {'shape': ''}},
+ 'name': 'zephyr-7b-beta',
+ 'offsetgroup': 'zephyr-7b-beta',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00106251]),
+ 'xaxis': 'x',
+ 'y': array(['zephyr-7b-beta'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'Mistral-7B-Instruct-v0.2',
+ 'marker': {'color': '#FECB52', 'pattern': {'shape': ''}},
+ 'name': 'Mistral-7B-Instruct-v0.2',
+ 'offsetgroup': 'Mistral-7B-Instruct-v0.2',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00049303]),
+ 'xaxis': 'x',
+ 'y': array(['Mistral-7B-Instruct-v0.2'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'Falcon Instruct (7B)',
+ 'marker': {'color': '#636efa', 'pattern': {'shape': ''}},
+ 'name': 'Falcon Instruct (7B)',
+ 'offsetgroup': 'Falcon Instruct (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.00021729]),
+ 'xaxis': 'x',
+ 'y': array(['Falcon Instruct (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'RedPajama-INCITE Chat (7B)',
+ 'marker': {'color': '#EF553B', 'pattern': {'shape': ''}},
+ 'name': 'RedPajama-INCITE Chat (7B)',
+ 'offsetgroup': 'RedPajama-INCITE Chat (7B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.]),
+ 'xaxis': 'x',
+ 'y': array(['RedPajama-INCITE Chat (7B)'], dtype=object),
+ 'yaxis': 'y'},
+ {'alignmentgroup': 'True',
+ 'hovertemplate': 'model=%{y}
bleu_score=%{x}',
+ 'legendgroup': 'Upstage SOLAR Instruct v1 (11B)',
+ 'marker': {'color': '#00cc96', 'pattern': {'shape': ''}},
+ 'name': 'Upstage SOLAR Instruct v1 (11B)',
+ 'offsetgroup': 'Upstage SOLAR Instruct v1 (11B)',
+ 'orientation': 'h',
+ 'showlegend': True,
+ 'textposition': 'auto',
+ 'type': 'bar',
+ 'x': array([0.]),
+ 'xaxis': 'x',
+ 'y': array(['Upstage SOLAR Instruct v1 (11B)'], dtype=object),
+ 'yaxis': 'y'}],
+ 'layout': {'barmode': 'relative',
+ 'legend': {'title': {'text': 'model'}, 'tracegroupgap': 0},
+ 'template': '...',
+ 'title': {'text': 'Summary metrics BLEU score'},
+ 'xaxis': {'anchor': 'y', 'domain': [0.0, 1.0], 'title': {'text': 'bleu_score'}},
+ 'yaxis': {'anchor': 'x',
+ 'categoryarray': [Upstage SOLAR Instruct v1 (11B),
+ RedPajama-INCITE Chat (7B), Falcon
+ Instruct (7B), Mistral-7B-Instruct-v0.2,
+ zephyr-7b-beta, gemini-pro,
+ Mixtral-8x7B-Instruct-v0.1, Snorkel
+ Mistral PairRM DPO (7B), chat-bison-32k
+ (PaLM 2 32K),
+ TinyLlama/TinyLlama-1.1B-Chat-v1.0, Qwen
+ 1.5 Chat (7B), llama-2-70b-chat, chat-
+ bison (PaLM 2), gpt-4-turbo, WizardLM
+ v1.2 (13B), LLaMA-2 Chat (7B), gpt-4,
+ Mistral (7B) Instruct v0.2 (Together
+ AI), OpenHermes-2.5-Mistral (7B), Vicuna
+ v1.5 (7B), 01-ai Yi Chat (34B),
+ gpt-3.5-turbo, Chronos Hermes (13B)],
+ 'categoryorder': 'array',
+ 'domain': [0.0, 1.0],
+ 'title': {'text': 'model'}}}
+})",Summary metrics BLEU score,"{""data"":[{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Chronos Hermes (13B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Chronos Hermes (13B)"",""offsetgroup"":""Chronos Hermes (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.011439012700594395],""xaxis"":""x"",""y"":[""Chronos Hermes (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-3.5-turbo"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""gpt-3.5-turbo"",""offsetgroup"":""gpt-3.5-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.007892445077902592],""xaxis"":""x"",""y"":[""gpt-3.5-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""01-ai Yi Chat (34B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""01-ai Yi Chat (34B)"",""offsetgroup"":""01-ai Yi Chat (34B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.007311566390840339],""xaxis"":""x"",""y"":[""01-ai Yi Chat (34B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Vicuna v1.5 (7B)"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""Vicuna v1.5 (7B)"",""offsetgroup"":""Vicuna v1.5 (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.006952332387656228],""xaxis"":""x"",""y"":[""Vicuna v1.5 (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""OpenHermes-2.5-Mistral (7B)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""OpenHermes-2.5-Mistral (7B)"",""offsetgroup"":""OpenHermes-2.5-Mistral (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.006563161880264231],""xaxis"":""x"",""y"":[""OpenHermes-2.5-Mistral (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Mistral (7B) Instruct v0.2 (Together AI)"",""offsetgroup"":""Mistral (7B) Instruct v0.2 (Together AI)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.005478518060743351],""xaxis"":""x"",""y"":[""Mistral (7B) Instruct v0.2 (Together AI)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""gpt-4"",""offsetgroup"":""gpt-4"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.004704572681138337],""xaxis"":""x"",""y"":[""gpt-4""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""LLaMA-2 Chat (7B)"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""LLaMA-2 Chat (7B)"",""offsetgroup"":""LLaMA-2 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.004255859538193306],""xaxis"":""x"",""y"":[""LLaMA-2 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""WizardLM v1.2 (13B)"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""WizardLM v1.2 (13B)"",""offsetgroup"":""WizardLM v1.2 (13B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.003671383039102015],""xaxis"":""x"",""y"":[""WizardLM v1.2 (13B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gpt-4-turbo"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""gpt-4-turbo"",""offsetgroup"":""gpt-4-turbo"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0034873692407505464],""xaxis"":""x"",""y"":[""gpt-4-turbo""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison (PaLM 2)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""chat-bison (PaLM 2)"",""offsetgroup"":""chat-bison (PaLM 2)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0033173472693443363],""xaxis"":""x"",""y"":[""chat-bison (PaLM 2)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""llama-2-70b-chat"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""llama-2-70b-chat"",""offsetgroup"":""llama-2-70b-chat"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.00329426273003284],""xaxis"":""x"",""y"":[""llama-2-70b-chat""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Qwen 1.5 Chat (7B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Qwen 1.5 Chat (7B)"",""offsetgroup"":""Qwen 1.5 Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.003185571110431172],""xaxis"":""x"",""y"":[""Qwen 1.5 Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""marker"":{""color"":""#ab63fa"",""pattern"":{""shape"":""""}},""name"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""offsetgroup"":""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.002991155730532842],""xaxis"":""x"",""y"":[""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""chat-bison-32k (PaLM 2 32K)"",""marker"":{""color"":""#FFA15A"",""pattern"":{""shape"":""""}},""name"":""chat-bison-32k (PaLM 2 32K)"",""offsetgroup"":""chat-bison-32k (PaLM 2 32K)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.002970914340485325],""xaxis"":""x"",""y"":[""chat-bison-32k (PaLM 2 32K)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Snorkel Mistral PairRM DPO (7B)"",""marker"":{""color"":""#19d3f3"",""pattern"":{""shape"":""""}},""name"":""Snorkel Mistral PairRM DPO (7B)"",""offsetgroup"":""Snorkel Mistral PairRM DPO (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.002907897771152987],""xaxis"":""x"",""y"":[""Snorkel Mistral PairRM DPO (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mixtral-8x7B-Instruct-v0.1"",""marker"":{""color"":""#FF6692"",""pattern"":{""shape"":""""}},""name"":""Mixtral-8x7B-Instruct-v0.1"",""offsetgroup"":""Mixtral-8x7B-Instruct-v0.1"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0026839271544750283],""xaxis"":""x"",""y"":[""Mixtral-8x7B-Instruct-v0.1""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""gemini-pro"",""marker"":{""color"":""#B6E880"",""pattern"":{""shape"":""""}},""name"":""gemini-pro"",""offsetgroup"":""gemini-pro"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0025439281189154664],""xaxis"":""x"",""y"":[""gemini-pro""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""zephyr-7b-beta"",""marker"":{""color"":""#FF97FF"",""pattern"":{""shape"":""""}},""name"":""zephyr-7b-beta"",""offsetgroup"":""zephyr-7b-beta"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0010625100735849574],""xaxis"":""x"",""y"":[""zephyr-7b-beta""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Mistral-7B-Instruct-v0.2"",""marker"":{""color"":""#FECB52"",""pattern"":{""shape"":""""}},""name"":""Mistral-7B-Instruct-v0.2"",""offsetgroup"":""Mistral-7B-Instruct-v0.2"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0004930290548816363],""xaxis"":""x"",""y"":[""Mistral-7B-Instruct-v0.2""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Falcon Instruct (7B)"",""marker"":{""color"":""#636efa"",""pattern"":{""shape"":""""}},""name"":""Falcon Instruct (7B)"",""offsetgroup"":""Falcon Instruct (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.00021729364201653395],""xaxis"":""x"",""y"":[""Falcon Instruct (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""RedPajama-INCITE Chat (7B)"",""marker"":{""color"":""#EF553B"",""pattern"":{""shape"":""""}},""name"":""RedPajama-INCITE Chat (7B)"",""offsetgroup"":""RedPajama-INCITE Chat (7B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""RedPajama-INCITE Chat (7B)""],""yaxis"":""y"",""type"":""bar""},{""alignmentgroup"":""True"",""hovertemplate"":""model=%{y}\u003cbr\u003ebleu_score=%{x}\u003cextra\u003e\u003c\u002fextra\u003e"",""legendgroup"":""Upstage SOLAR Instruct v1 (11B)"",""marker"":{""color"":""#00cc96"",""pattern"":{""shape"":""""}},""name"":""Upstage SOLAR Instruct v1 (11B)"",""offsetgroup"":""Upstage SOLAR Instruct v1 (11B)"",""orientation"":""h"",""showlegend"":true,""textposition"":""auto"",""x"":[0.0],""xaxis"":""x"",""y"":[""Upstage SOLAR Instruct v1 (11B)""],""yaxis"":""y"",""type"":""bar""}],""layout"":{""template"":{""data"":{""histogram2dcontour"":[{""type"":""histogram2dcontour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""choropleth"":[{""type"":""choropleth"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""histogram2d"":[{""type"":""histogram2d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmap"":[{""type"":""heatmap"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""heatmapgl"":[{""type"":""heatmapgl"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""contourcarpet"":[{""type"":""contourcarpet"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""contour"":[{""type"":""contour"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""surface"":[{""type"":""surface"",""colorbar"":{""outlinewidth"":0,""ticks"":""""},""colorscale"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]]}],""mesh3d"":[{""type"":""mesh3d"",""colorbar"":{""outlinewidth"":0,""ticks"":""""}}],""scatter"":[{""fillpattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2},""type"":""scatter""}],""parcoords"":[{""type"":""parcoords"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolargl"":[{""type"":""scatterpolargl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""bar"":[{""error_x"":{""color"":""#2a3f5f""},""error_y"":{""color"":""#2a3f5f""},""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""bar""}],""scattergeo"":[{""type"":""scattergeo"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterpolar"":[{""type"":""scatterpolar"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""histogram"":[{""marker"":{""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""histogram""}],""scattergl"":[{""type"":""scattergl"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatter3d"":[{""type"":""scatter3d"",""line"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattermapbox"":[{""type"":""scattermapbox"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scatterternary"":[{""type"":""scatterternary"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""scattercarpet"":[{""type"":""scattercarpet"",""marker"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}}}],""carpet"":[{""aaxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""baxis"":{""endlinecolor"":""#2a3f5f"",""gridcolor"":""white"",""linecolor"":""white"",""minorgridcolor"":""white"",""startlinecolor"":""#2a3f5f""},""type"":""carpet""}],""table"":[{""cells"":{""fill"":{""color"":""#EBF0F8""},""line"":{""color"":""white""}},""header"":{""fill"":{""color"":""#C8D4E3""},""line"":{""color"":""white""}},""type"":""table""}],""barpolar"":[{""marker"":{""line"":{""color"":""#E5ECF6"",""width"":0.5},""pattern"":{""fillmode"":""overlay"",""size"":10,""solidity"":0.2}},""type"":""barpolar""}],""pie"":[{""automargin"":true,""type"":""pie""}]},""layout"":{""autotypenumbers"":""strict"",""colorway"":[""#636efa"",""#EF553B"",""#00cc96"",""#ab63fa"",""#FFA15A"",""#19d3f3"",""#FF6692"",""#B6E880"",""#FF97FF"",""#FECB52""],""font"":{""color"":""#2a3f5f""},""hovermode"":""closest"",""hoverlabel"":{""align"":""left""},""paper_bgcolor"":""white"",""plot_bgcolor"":""#E5ECF6"",""polar"":{""bgcolor"":""#E5ECF6"",""angularaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""radialaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""ternary"":{""bgcolor"":""#E5ECF6"",""aaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""baxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""},""caxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":""""}},""coloraxis"":{""colorbar"":{""outlinewidth"":0,""ticks"":""""}},""colorscale"":{""sequential"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""sequentialminus"":[[0.0,""#0d0887""],[0.1111111111111111,""#46039f""],[0.2222222222222222,""#7201a8""],[0.3333333333333333,""#9c179e""],[0.4444444444444444,""#bd3786""],[0.5555555555555556,""#d8576b""],[0.6666666666666666,""#ed7953""],[0.7777777777777778,""#fb9f3a""],[0.8888888888888888,""#fdca26""],[1.0,""#f0f921""]],""diverging"":[[0,""#8e0152""],[0.1,""#c51b7d""],[0.2,""#de77ae""],[0.3,""#f1b6da""],[0.4,""#fde0ef""],[0.5,""#f7f7f7""],[0.6,""#e6f5d0""],[0.7,""#b8e186""],[0.8,""#7fbc41""],[0.9,""#4d9221""],[1,""#276419""]]},""xaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""yaxis"":{""gridcolor"":""white"",""linecolor"":""white"",""ticks"":"""",""title"":{""standoff"":15},""zerolinecolor"":""white"",""automargin"":true,""zerolinewidth"":2},""scene"":{""xaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""yaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2},""zaxis"":{""backgroundcolor"":""#E5ECF6"",""gridcolor"":""white"",""linecolor"":""white"",""showbackground"":true,""ticks"":"""",""zerolinecolor"":""white"",""gridwidth"":2}},""shapedefaults"":{""line"":{""color"":""#2a3f5f""}},""annotationdefaults"":{""arrowcolor"":""#2a3f5f"",""arrowhead"":0,""arrowwidth"":1},""geo"":{""bgcolor"":""white"",""landcolor"":""#E5ECF6"",""subunitcolor"":""white"",""showland"":true,""showlakes"":true,""lakecolor"":""white""},""title"":{""x"":0.05},""mapbox"":{""style"":""light""}}},""xaxis"":{""anchor"":""y"",""domain"":[0.0,1.0],""title"":{""text"":""bleu_score""}},""yaxis"":{""anchor"":""x"",""domain"":[0.0,1.0],""title"":{""text"":""model""},""categoryorder"":""array"",""categoryarray"":[""Upstage SOLAR Instruct v1 (11B)"",""RedPajama-INCITE Chat (7B)"",""Falcon Instruct (7B)"",""Mistral-7B-Instruct-v0.2"",""zephyr-7b-beta"",""gemini-pro"",""Mixtral-8x7B-Instruct-v0.1"",""Snorkel Mistral PairRM DPO (7B)"",""chat-bison-32k (PaLM 2 32K)"",""TinyLlama\u002fTinyLlama-1.1B-Chat-v1.0"",""Qwen 1.5 Chat (7B)"",""llama-2-70b-chat"",""chat-bison (PaLM 2)"",""gpt-4-turbo"",""WizardLM v1.2 (13B)"",""LLaMA-2 Chat (7B)"",""gpt-4"",""Mistral (7B) Instruct v0.2 (Together AI)"",""OpenHermes-2.5-Mistral (7B)"",""Vicuna v1.5 (7B)"",""01-ai Yi Chat (34B)"",""gpt-3.5-turbo"",""Chronos Hermes (13B)""]},""legend"":{""title"":{""text"":""model""},""tracegroupgap"":0},""title"":{""text"":""Summary metrics BLEU score""},""barmode"":""relative""}}","BLEU (BiLingual Evaluation Understudy) measures similarity between unigrams, bigrams and trigrams in the summarized and original text. Unlike BERT score this metric doesn't handle synonyms. Value is averaged for each model.",",model,bert_score_P,bert_score_R,bert_score_F1,original_text_length_part,sentence_count,length_penalty,bleu_score
+1,Chronos Hermes (13B),0.3124825,0.31071666,0.311415,0.4742810243835248,3.5818443804034583,14928.0,0.011439012700594395
+18,gpt-3.5-turbo,0.4943981,0.48408476,0.4888874,0.5905700146991734,4.229639819909955,89814.0,0.007892445077902592
+0,01-ai Yi Chat (34B),0.33974892,0.3404481,0.3399749,0.43251538287409536,3.5818443804034583,14928.0,0.007311566390840339
+13,Vicuna v1.5 (7B),0.284109,0.27878883,0.28129113,0.2781035051738079,3.6173027989821884,16948.0,0.006952332387656228
+7,OpenHermes-2.5-Mistral (7B),0.3618188,0.35180506,0.3565194,0.312054520357568,3.5818443804034583,14928.0,0.006563161880264231
+4,Mistral (7B) Instruct v0.2 (Together AI),0.3647361,0.3664233,0.36540908,0.5233998570385472,3.712222222222222,29298.0,0.005478518060743351
+19,gpt-4,0.48605907,0.472583,0.47901583,0.4763731952669352,4.266137566137566,85120.0,0.004704572681138337
+3,LLaMA-2 Chat (7B),0.3203912,0.3153909,0.31770444,0.4084233313416049,3.5818443804034583,14928.0,0.004255859538193306
+14,WizardLM v1.2 (13B),0.34085444,0.32933056,0.33466902,0.28716720161049375,3.5818443804034583,14928.0,0.003671383039102015
+20,gpt-4-turbo,0.42728576,0.4162435,0.42098433,0.5393220459796505,4.266137566137566,85120.0,0.0034873692407505464
+15,chat-bison (PaLM 2),0.23117188,0.23029378,0.23060663,0.2927236655934559,4.281081081081081,83400.0,0.0033173472693443363
+21,llama-2-70b-chat,0.20800962,0.21472095,0.21117964,0.29684572894554634,4.2436893203883495,88008.0,0.00329426273003284
+8,Qwen 1.5 Chat (7B),0.34855434,0.34154576,0.344803,0.29904529709475364,3.5818443804034583,14928.0,0.003185571110431172
+11,TinyLlama/TinyLlama-1.1B-Chat-v1.0,0.122185074,0.11885959,0.12042627,0.13915355617375091,4.244871794871795,87700.0,0.002991155730532842
+16,chat-bison-32k (PaLM 2 32K),0.23046139,0.22983725,0.23002876,0.2608806894318779,4.281081081081081,83400.0,0.002970914340485325
+10,Snorkel Mistral PairRM DPO (7B),0.31672964,0.33782956,0.3265383,3.7740234383755356,3.5818443804034583,14928.0,0.002907897771152987
+6,Mixtral-8x7B-Instruct-v0.1,0.19128644,0.19555509,0.19330867,0.2665288353398184,4.161038961038961,103320.0,0.0026839271544750283
+17,gemini-pro,0.23105659,0.23057175,0.23072062,0.295286999418032,4.244871794871795,87700.0,0.0025439281189154664
+22,zephyr-7b-beta,0.085390136,0.08266569,0.08394519,0.08796697338212889,4.159788702026735,103714.0,0.0010625100735849574
+5,Mistral-7B-Instruct-v0.2,0.043820098,0.042561684,0.04313921,0.04250630683894714,4.120342654588421,113258.0,0.0004930290548816363
+2,Falcon Instruct (7B),0.2895086,0.23968808,0.2615204,0.0490635544441649,3.5818443804034583,14928.0,0.00021729364201653395
+9,RedPajama-INCITE Chat (7B),0.261367,0.23758642,0.2487217,0.0560284823193376,3.5818443804034583,14928.0,0.0
+12,Upstage SOLAR Instruct v1 (11B),0.0,0.0,0.0,0.0017662349842492329,3.5818443804034583,14928.0,0.0
+","{""x"": ""bleu_score"", ""y"": ""model"", ""color"": ""model"", ""orientation"": ""h"", ""title"": ""Summary metrics BLEU score""}"