Qwen
/

Qwen3-4B-Instruct-2507

@@ -3,6 +3,117 @@ library_name: transformers
 license: apache-2.0
 license_link: https://huggingface.co/Qwen/Qwen3-4B-Instruct-2507/blob/main/LICENSE
 pipeline_tag: text-generation
 ---
 # Qwen3-4B-Instruct-2507

 license: apache-2.0
 license_link: https://huggingface.co/Qwen/Qwen3-4B-Instruct-2507/blob/main/LICENSE
 pipeline_tag: text-generation
+# Evaluation results for Qwen3-4B-Instruct-2507, one `results` entry per
+# benchmark. `task.type` holds a Hub task id (kept in line with `pipeline_tag`
+# for generative benchmarks); the benchmark category goes in `task.name`.
+model-index:
+- name: Qwen3-4B-Instruct-2507
+  results:
+  - task:
+      type: question-answering
+    dataset:
+      name: GPQA
+      type: gpqa
+    metrics:
+    - name: Accuracy
+      type: accuracy
+      value: 50.3
+  - task:
+      type: question-answering
+    dataset:
+      name: SuperGPQA
+      type: supergpqa
+    metrics:
+    - name: Accuracy
+      type: accuracy
+      value: 32.2
+  - task:
+      type: text-generation
+      name: Reasoning
+    dataset:
+      name: AIME25
+      type: aime25
+    metrics:
+    - name: Score
+      type: score
+      value: 22.7
+  - task:
+      type: text-generation
+      name: Reasoning
+    dataset:
+      name: HMMT25
+      type: hmmt25
+    metrics:
+    - name: Score
+      type: score
+      value: 9.7
+  - task:
+      type: text-generation
+      name: Reasoning
+    dataset:
+      name: ZebraLogic
+      type: zebralogic
+    metrics:
+    - name: Score
+      type: score
+      value: 14.8
+  - task:
+      type: text-generation
+      name: Reasoning
+    dataset:
+      name: LiveBench 20241125
+      type: livebench_20241125
+    metrics:
+    - name: Score
+      type: score
+      value: 41.5
+  - task:
+      type: text-generation
+    dataset:
+      name: IFEval
+      type: ifeval
+    metrics:
+    - name: Score
+      type: score
+      value: 74.5
+  - task:
+      type: text-generation
+    dataset:
+      name: Creative Writing v3
+      type: creative_writing_v3
+    metrics:
+    - name: Score
+      type: score
+      value: 72.7
+  - task:
+      type: text-generation
+    dataset:
+      name: WritingBench
+      type: writingbench
+    metrics:
+    - name: Score
+      type: score
+      value: 66.9
+  - task:
+      type: text-generation
+    dataset:
+      name: MultiIF
+      type: multiif
+    metrics:
+    - name: Score
+      type: score
+      value: 60.7
+  - task:
+      type: text-generation
+    dataset:
+      name: INCLUDE
+      type: include
+    metrics:
+    - name: Score
+      type: score
+      value: 58.6
+  - task:
+      type: text-generation
+      name: Reasoning
+    dataset:
+      name: PolyMATH
+      type: polymath
+    metrics:
+    - name: Score
+      type: score
+      value: 15.6
 ---
 # Qwen3-4B-Instruct-2507