icefog72
/

IceEspressoRPv2-7b

@@ -1,10 +1,104 @@
 ---
-base_model: []
 library_name: transformers
 tags:
 - mergekit
 - merge
 ---
 # IceEspressoRPv2-7b
@@ -47,3 +141,17 @@ dtype: bfloat16
 ```

 ---
 library_name: transformers
 tags:
 - mergekit
 - merge
+base_model: []
+model-index:  # Open LLM Leaderboard scores; one results entry per benchmark
+- name: IceEspressoRPv2-7b
+  results:
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: IFEval (0-Shot)
+      type: HuggingFaceH4/ifeval
+      args:
+        num_few_shot: 0
+    metrics:
+    - type: inst_level_strict_acc and prompt_level_strict_acc
+      value: 49.77
+      name: strict accuracy
+    source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=icefog72/IceEspressoRPv2-7b
+      name: Open LLM Leaderboard
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: BBH (3-Shot)
+      type: BBH
+      args:
+        num_few_shot: 3
+    metrics:
+    - type: acc_norm
+      value: 31.3
+      name: normalized accuracy
+    source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=icefog72/IceEspressoRPv2-7b
+      name: Open LLM Leaderboard
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: MATH Lvl 5 (4-Shot)
+      type: hendrycks/competition_math
+      args:
+        num_few_shot: 4
+    metrics:
+    - type: exact_match
+      value: 5.51
+      name: exact match
+    source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=icefog72/IceEspressoRPv2-7b
+      name: Open LLM Leaderboard
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: GPQA (0-shot)
+      type: Idavidrein/gpqa
+      args:
+        num_few_shot: 0
+    metrics:
+    - type: acc_norm
+      value: 5.26
+      name: acc_norm
+    source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=icefog72/IceEspressoRPv2-7b
+      name: Open LLM Leaderboard
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: MuSR (0-shot)
+      type: TAUR-Lab/MuSR
+      args:
+        num_few_shot: 0
+    metrics:
+    - type: acc_norm
+      value: 12.77
+      name: acc_norm
+    source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=icefog72/IceEspressoRPv2-7b
+      name: Open LLM Leaderboard
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: MMLU-PRO (5-shot)
+      type: TIGER-Lab/MMLU-Pro
+      config: main
+      split: test
+      args:
+        num_few_shot: 5
+    metrics:
+    - type: acc
+      value: 22.9
+      name: accuracy
+    source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=icefog72/IceEspressoRPv2-7b
+      name: Open LLM Leaderboard
 ---
 # IceEspressoRPv2-7b
 ```
+# [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard)
+Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/details_icefog72__IceEspressoRPv2-7b)
+|      Metric       |Value|
+|-------------------|----:|
+|Avg.               |21.25|
+|IFEval (0-Shot)    |49.77|
+|BBH (3-Shot)       |31.30|
+|MATH Lvl 5 (4-Shot)| 5.51|
+|GPQA (0-shot)      | 5.26|
+|MuSR (0-shot)      |12.77|
+|MMLU-PRO (5-shot)  |22.90|