opencompass
/

CompassJudger-2-7B-Instruct

@@ -1,10 +1,10 @@
 ---
-license: apache-2.0
-pipeline_tag: text-generation
 library_name: transformers
 tags:
-  - llm-as-judge
-  - qwen2
 ---
 # CompassJudger-2
@@ -59,11 +59,11 @@ from transformers import AutoModelForCausalLM, AutoTokenizer
 model_path = "opencompass/CompassJudger-2-7B-Instruct"
 model = AutoModelForCausalLM.from_pretrained(
-    model_name,
     torch_dtype="auto",
     device_map="auto"
 )
-tokenizer = AutoTokenizer.from_pretrained(model_name)
 # Example: Pair-wise Comparison
 prompt = """
@@ -125,7 +125,7 @@ CompassJudger-2 sets a new state-of-the-art for judge models, outperforming gene
 | Skywork-Critic-Llama-3.1-70B       |     52.41      |   50.65    |   65.50   |    93.30    |   65.47   |
 | RISE-Judge-Qwen2.5-32B             |     56.42      |   63.87    |   73.70   |    92.70    |   71.67   |
 | **CompassJudger-2-32B-Instruct**   |   **62.21**   | **65.48**  |   72.98   |  **92.62**  | **73.32** |
-| **General Models (for reference)** |                |            |           |             |           |
 | Qwen2.5-32B-Instruct               |     62.97      |   59.84    |   74.99   |    85.61    |   70.85   |
 | DeepSeek-V3-0324                   |     64.43      |   59.68    |   78.16   |    85.17    |   71.86   |
 | Qwen3-235B-A22B                    |     61.40      |   65.97    |   75.59   |    84.68    |   71.91   |

 ---
 library_name: transformers
+license: apache-2.0
+pipeline_tag: text-ranking
 tags:
+- llm-as-judge
+- qwen2
 ---
 # CompassJudger-2
 model_path = "opencompass/CompassJudger-2-7B-Instruct"
 model = AutoModelForCausalLM.from_pretrained(
+    model_path,
     torch_dtype="auto",
     device_map="auto"
 )
+tokenizer = AutoTokenizer.from_pretrained(model_path)
 # Example: Pair-wise Comparison
 prompt = """
 | Skywork-Critic-Llama-3.1-70B       |     52.41      |   50.65    |   65.50   |    93.30    |   65.47   |
 | RISE-Judge-Qwen2.5-32B             |     56.42      |   63.87    |   73.70   |    92.70    |   71.67   |
 | **CompassJudger-2-32B-Instruct**   |   **62.21**   | **65.48**  |   72.98   |  **92.62**  | **73.32** |
+| **General Models (for reference)** |                |            |           |             |           |
 | Qwen2.5-32B-Instruct               |     62.97      |   59.84    |   74.99   |    85.61    |   70.85   |
 | DeepSeek-V3-0324                   |     64.43      |   59.68    |   78.16   |    85.17    |   71.86   |
 | Qwen3-235B-A22B                    |     61.40      |   65.97    |   75.59   |    84.68    |   71.91   |