DavidAU
/

L3-SMB-Instruct-12.2B-F32

@@ -1,10 +1,104 @@
 ---
-base_model: []
 library_name: transformers
 tags:
 - mergekit
 - merge
 ---
 <h2>L3-SMB-Instruct-12.2B-F32</h2>
@@ -91,3 +185,17 @@ slices:
 merge_method: passthrough
 dtype: float32
 ```

 ---
 library_name: transformers
 tags:
 - mergekit
 - merge
+base_model: []
+# Evaluation results (model-index); each entry's source is the Open LLM Leaderboard.
+model-index:
+- name: L3-SMB-Instruct-12.2B-F32
+  results:
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: IFEval (0-Shot)
+      type: HuggingFaceH4/ifeval
+      args:
+        num_few_shot: 0
+    metrics:
+    - type: inst_level_strict_acc and prompt_level_strict_acc
+      value: 43.03
+      name: strict accuracy
+    source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=DavidAU/L3-SMB-Instruct-12.2B-F32
+      name: Open LLM Leaderboard
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: BBH (3-Shot)
+      type: BBH
+      args:
+        num_few_shot: 3
+    metrics:
+    - type: acc_norm
+      value: 26.13
+      name: normalized accuracy
+    source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=DavidAU/L3-SMB-Instruct-12.2B-F32
+      name: Open LLM Leaderboard
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: MATH Lvl 5 (4-Shot)
+      type: hendrycks/competition_math
+      args:
+        num_few_shot: 4
+    metrics:
+    - type: exact_match
+      value: 4.08
+      name: exact match
+    source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=DavidAU/L3-SMB-Instruct-12.2B-F32
+      name: Open LLM Leaderboard
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: GPQA (0-shot)
+      type: Idavidrein/gpqa
+      args:
+        num_few_shot: 0
+    metrics:
+    - type: acc_norm
+      value: 4.25
+      name: acc_norm
+    source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=DavidAU/L3-SMB-Instruct-12.2B-F32
+      name: Open LLM Leaderboard
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: MuSR (0-shot)
+      type: TAUR-Lab/MuSR
+      args:
+        num_few_shot: 0
+    metrics:
+    - type: acc_norm
+      value: 9.62
+      name: acc_norm
+    source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=DavidAU/L3-SMB-Instruct-12.2B-F32
+      name: Open LLM Leaderboard
+  - task:
+      type: text-generation
+      name: Text Generation
+    dataset:
+      name: MMLU-PRO (5-shot)
+      type: TIGER-Lab/MMLU-Pro
+      config: main
+      split: test
+      args:
+        num_few_shot: 5
+    metrics:
+    - type: acc
+      value: 25.69
+      name: accuracy
+    source:
+      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=DavidAU/L3-SMB-Instruct-12.2B-F32
+      name: Open LLM Leaderboard
 ---
 <h2>L3-SMB-Instruct-12.2B-F32</h2>
 merge_method: passthrough
 dtype: float32
 ```
+# [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard)
+Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/details_DavidAU__L3-SMB-Instruct-12.2B-F32)
+
+|      Metric       |Value|
+|-------------------|----:|
+|Avg.               |18.80|
+|IFEval (0-Shot)    |43.03|
+|BBH (3-Shot)       |26.13|
+|MATH Lvl 5 (4-Shot)| 4.08|
+|GPQA (0-shot)      | 4.25|
+|MuSR (0-shot)      | 9.62|
+|MMLU-PRO (5-shot)  |25.69|