launch
/

ThinkPRM-14B

@@ -9,6 +9,8 @@ tags:
 - verification
 - math reasoning
 - code verification
 ---
 # Model Card for ThinkPRM-14B
@@ -60,7 +62,8 @@ llm = LLM(model=model_id, max_model_len=16384)
 # Example problem and solution
 problem = "Solve for x: 2x + 3 = 7"
-prefix = "Step 1: Subtract 3 from both sides: 2x = 4\nStep 2: Divide by 2: x = 1"
 # Format the prompt
 prompt = f"""You are given a math problem and a proposed step-by-step solution:
@@ -78,7 +81,8 @@ Review and critique each step in the proposed solution to determine whether each
 prompt = tokenizer.apply_chat_template([
     {'role': "user", "content": prompt}
-], tokenize=False, add_generation_prompt=True) + "\nLet's verify step by step:"
 # Set sampling parameters
 sampling_params = SamplingParams(

 - verification
 - math reasoning
 - code verification
+license: apache-2.0
+pipeline_tag: text-generation
 ---
 # Model Card for ThinkPRM-14B
 # Example problem and solution
 problem = "Solve for x: 2x + 3 = 7"
+prefix = "Step 1: Subtract 3 from both sides: 2x = 4\nStep 2: Divide by 2: x = 1"
 # Format the prompt
 prompt = f"""You are given a math problem and a proposed step-by-step solution:
 prompt = tokenizer.apply_chat_template([
     {'role': "user", "content": prompt}
+], tokenize=False, add_generation_prompt=True) + "\nLet's verify step by step:"
 # Set sampling parameters
 sampling_params = SamplingParams(