Adding Evaluation Results

#1
Files changed (1)
  1. README.md +19 -6
README.md CHANGED
@@ -1,15 +1,15 @@
 ---
+license: cc-by-nc-4.0
+library_name: transformers
+tags:
+- mergekit
+- merge
 base_model:
 - mistralai/Mistral-7B-v0.1
 - argilla/distilabeled-OpenHermes-2.5-Mistral-7B
 - NeverSleep/Noromaid-7B-0.4-DPO
 - senseable/WestLake-7B-v2
 - mlabonne/AlphaMonarch-7B
-library_name: transformers
-tags:
-- mergekit
-- merge
-license: cc-by-nc-4.0
 model-index:
 - name: WestLake_Noromaid_OpenHermes_neural-chatv0.1
   results:
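The hunk above only reorders the YAML front matter, moving `license`, `library_name`, and `tags` ahead of `base_model`. For reference, a minimal sketch of applying an equivalent metadata edit through the Hub API with `huggingface_hub.metadata_update`; the repo id is an assumption inferred from the details-dataset name in the next hunk, not stated in this diff:

```python
# Sketch: apply the same front-matter keys via the Hub API.
# Assumption: the target repo id (inferred from the leaderboard
# details-dataset name, not confirmed by this diff).
from huggingface_hub import metadata_update

metadata_update(
    repo_id="giraffe176/WestMaid_HermesMonarchv0.1",  # assumed repo id
    metadata={
        "license": "cc-by-nc-4.0",
        "library_name": "transformers",
        "tags": ["mergekit", "merge"],
    },
    overwrite=True,   # replace existing values for these keys
    create_pr=True,   # open a PR like this one instead of committing directly
)
```

Note that `metadata_update` merges keys rather than reordering them, so the resulting front matter may differ in key order from the hunk above.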
@@ -205,4 +205,17 @@ dtype: bfloat16
 | NeverSleep/Noromaid-7B-0.4-DPO | | | 59.08 | 62.29 | 84.32 | 63.2 | 42.28 | 76.95 | 25.47 |
 | claude-v1 | 7.900000 | 76.83 | | | | | | | |
 | gpt-3.5-turbo | 7.943750 | 71.74 | | | | | | | |
-| | [(Paper)](https://arxiv.org/abs/2306.05685) | [(Paper)](https://arxiv.org/abs/2312.06281) [Leaderboard](https://eqbench.com/) | | | | | | | |
+| | [(Paper)](https://arxiv.org/abs/2306.05685) | [(Paper)](https://arxiv.org/abs/2312.06281) [Leaderboard](https://eqbench.com/) | | | | | | | |
+# [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/HuggingFaceH4/open_llm_leaderboard)
+Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/details_giraffe176__WestMaid_HermesMonarchv0.1)
+
+| Metric                           | Value |
+|----------------------------------|------:|
+| Avg.                             | 72.62 |
+| AI2 Reasoning Challenge (25-shot)| 70.22 |
+| HellaSwag (10-shot)              | 87.42 |
+| MMLU (5-shot)                    | 64.31 |
+| TruthfulQA (0-shot)              | 61.99 |
+| Winogrande (5-shot)              | 82.16 |
+| GSM8k (5-shot)                   | 69.60 |
+
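As a quick sanity check on the added table, the reported Avg. is the unweighted mean of the six benchmark scores:

```python
# Sanity check: the leaderboard "Avg." is the plain mean of the six scores.
scores = {
    "ARC (25-shot)": 70.22,
    "HellaSwag (10-shot)": 87.42,
    "MMLU (5-shot)": 64.31,
    "TruthfulQA (0-shot)": 61.99,
    "Winogrande (5-shot)": 82.16,
    "GSM8k (5-shot)": 69.60,
}
avg = sum(scores.values()) / len(scores)
print(f"{avg:.2f}")  # 72.62, matching the Avg. row
```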
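Since the front matter now declares `library_name: transformers`, the merged model should load with the standard `transformers` API. A minimal usage sketch, assuming the repo id `giraffe176/WestMaid_HermesMonarchv0.1` (inferred from the details-dataset name, not stated in this diff) and the `bfloat16` dtype shown in the merge config context above:

```python
# Usage sketch under the assumptions stated above; the repo id is inferred,
# not confirmed by this diff.
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

model_id = "giraffe176/WestMaid_HermesMonarchv0.1"  # assumed repo id
tokenizer = AutoTokenizer.from_pretrained(model_id)
model = AutoModelForCausalLM.from_pretrained(
    model_id,
    torch_dtype=torch.bfloat16,  # matches the merge config's dtype: bfloat16
)

inputs = tokenizer("The capital of France is", return_tensors="pt")
outputs = model.generate(**inputs, max_new_tokens=20)
print(tokenizer.decode(outputs[0], skip_special_tokens=True))
```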