wanlige
/

li-14b-v0.4

@@ -12,195 +12,114 @@ base_model:
 - SicariusSicariiStuff/Impish_QWEN_14B-1M
 - Qwen/Qwen2.5-14B
 model-index:
 - name: li-14b-v0.4
   results:
   - task:
       type: text-generation
       name: Text Generation
     dataset:
       name: IFEval (0-Shot)
       type: HuggingFaceH4/ifeval
       args:
         num_few_shot: 0
     metrics:
     - type: inst_level_strict_acc and prompt_level_strict_acc
       value: 81.33
       name: strict accuracy
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=wanlige/li-14b-v0.4
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       name: Text Generation
     dataset:
       name: BBH (3-Shot)
       type: BBH
       args:
         num_few_shot: 3
     metrics:
     - type: acc_norm
       value: 50.38
       name: normalized accuracy
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=wanlige/li-14b-v0.4
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       name: Text Generation
     dataset:
       name: MATH Lvl 5 (4-Shot)
       type: hendrycks/competition_math
       args:
         num_few_shot: 4
     metrics:
     - type: exact_match
       value: 55.74
       name: exact match
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=wanlige/li-14b-v0.4
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       name: Text Generation
     dataset:
       name: GPQA (0-shot)
       type: Idavidrein/gpqa
       args:
         num_few_shot: 0
     metrics:
     - type: acc_norm
       value: 11.86
       name: acc_norm
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=wanlige/li-14b-v0.4
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       name: Text Generation
     dataset:
       name: MuSR (0-shot)
       type: TAUR-Lab/MuSR
       args:
         num_few_shot: 0
     metrics:
     - type: acc_norm
       value: 16.35
       name: acc_norm
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=wanlige/li-14b-v0.4
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       name: Text Generation
     dataset:
       name: MMLU-PRO (5-shot)
       type: TIGER-Lab/MMLU-Pro
       config: main
       split: test
       args:
         num_few_shot: 5
     metrics:
     - type: acc
       value: 46.3
       name: accuracy
     source:
-      url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=wanlige/li-14b-v0.4
       name: Open LLM Leaderboard
 ---
 > [!TIP] This model is currently ranked #1 among models with up to 15B parameters and #50 among all models on the [Open LLM Leaderboard](https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard).
@@ -381,7 +300,4 @@ Detailed results can be found [here](https://huggingface.co/datasets/open-llm-le
 |MuSR (0-shot)      |16.35|
-|MMLU-PRO (5-shot)  |46.30|

 - SicariusSicariiStuff/Impish_QWEN_14B-1M
 - Qwen/Qwen2.5-14B
 model-index:
 - name: li-14b-v0.4
   results:
   - task:
       type: text-generation
       name: Text Generation
     dataset:
       name: IFEval (0-Shot)
       type: HuggingFaceH4/ifeval
       args:
         num_few_shot: 0
     metrics:
     - type: inst_level_strict_acc and prompt_level_strict_acc
       value: 81.33
       name: strict accuracy
     source:
+      url: >-
+        https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=wanlige/li-14b-v0.4
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       name: Text Generation
     dataset:
       name: BBH (3-Shot)
       type: BBH
       args:
         num_few_shot: 3
     metrics:
     - type: acc_norm
       value: 50.38
       name: normalized accuracy
     source:
+      url: >-
+        https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=wanlige/li-14b-v0.4
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       name: Text Generation
     dataset:
       name: MATH Lvl 5 (4-Shot)
       type: hendrycks/competition_math
       args:
         num_few_shot: 4
     metrics:
     - type: exact_match
       value: 55.74
       name: exact match
     source:
+      url: >-
+        https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=wanlige/li-14b-v0.4
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       name: Text Generation
     dataset:
       name: GPQA (0-shot)
       type: Idavidrein/gpqa
       args:
         num_few_shot: 0
     metrics:
     - type: acc_norm
       value: 11.86
       name: acc_norm
     source:
+      url: >-
+        https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=wanlige/li-14b-v0.4
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       name: Text Generation
     dataset:
       name: MuSR (0-shot)
       type: TAUR-Lab/MuSR
       args:
         num_few_shot: 0
     metrics:
     - type: acc_norm
       value: 16.35
       name: acc_norm
     source:
+      url: >-
+        https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=wanlige/li-14b-v0.4
       name: Open LLM Leaderboard
   - task:
       type: text-generation
       name: Text Generation
     dataset:
       name: MMLU-PRO (5-shot)
       type: TIGER-Lab/MMLU-Pro
       config: main
       split: test
       args:
         num_few_shot: 5
     metrics:
     - type: acc
       value: 46.3
       name: accuracy
     source:
+      url: >-
+        https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=wanlige/li-14b-v0.4
       name: Open LLM Leaderboard
+license: apache-2.0
+language:
+- zh
+- en
+- fr
+- sa
+- de
+pipeline_tag: text-generation
 ---
 > [!TIP] This model is currently ranked #1 among models with up to 15B parameters and #50 among all models on the [Open LLM Leaderboard](https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard).
 |MuSR (0-shot)      |16.35|
+|MMLU-PRO (5-shot)  |46.30|