
Commit f0a37d2

Add instruct model option to verifier scripts (#82)
* update verifier scripts
* Update ch03/02_math500-verifier-scripts/evaluate_math500_batched.py
* update
1 parent c8aaf18 · commit f0a37d2
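With this change, both verifier scripts accept the new value on the command line, e.g. python ch03/02_math500-verifier-scripts/evaluate_math500.py --which_model instruct (a representative invocation; the scripts' other flags keep their existing defaults).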

File tree

3 files changed: +48 -52 lines


ch03/02_math500-verifier-scripts/evaluate_math500.py

Lines changed: 1 addition & 1 deletion
@@ -44,7 +44,7 @@ def parse_args():
         "--which_model",
         type=str,
         default="base",
-        choices=["base", "reasoning"],
+        choices=["base", "reasoning", "instruct"],
         help="Model variant to load. Defaults to 'base'.",
     )
     parser.add_argument(
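This one-line change is sufficient at the CLI level because argparse validates --which_model against the declared choices. A minimal, self-contained sketch of that mechanism (illustrative only, not the script's actual parser):

import argparse

# Sketch: argparse rejects any --which_model value outside `choices`,
# so adding "instruct" to the list is all the CLI-level change needed.
parser = argparse.ArgumentParser()
parser.add_argument(
    "--which_model",
    type=str,
    default="base",
    choices=["base", "reasoning", "instruct"],
)

args = parser.parse_args(["--which_model", "instruct"])
print(args.which_model)  # -> instruct
# parser.parse_args(["--which_model", "chat"]) would exit with
# an "invalid choice: 'chat'" error message.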

ch03/02_math500-verifier-scripts/evaluate_math500_batched.py

Lines changed: 2 additions & 49 deletions
@@ -14,14 +14,7 @@
 import torch
 
 from reasoning_from_scratch.ch02 import get_device
-from reasoning_from_scratch.qwen3 import (
-    download_qwen3_small,
-    Qwen3Tokenizer,
-    QWEN_CONFIG_06_B,
-)
-from reasoning_from_scratch.qwen3_batched import (
-    Qwen3Model as Qwen3ModelBatched,
-)
+from reasoning_from_scratch.qwen3_batched import get_model
 from reasoning_from_scratch.ch03 import (
     render_prompt,
     extract_final_candidate,
@@ -47,46 +40,6 @@ def get_data():
     return math_data
 
 
-def get_model(which_model, device, use_compile):
-    if which_model == "base":
-
-        download_qwen3_small(
-            kind="base", tokenizer_only=False, out_dir="qwen3"
-        )
-
-        tokenizer_path = Path("qwen3") / "tokenizer-base.json"
-        model_path = Path("qwen3") / "qwen3-0.6B-base.pth"
-        tokenizer = Qwen3Tokenizer(tokenizer_file_path=tokenizer_path)
-
-    elif which_model == "reasoning":
-
-        download_qwen3_small(
-            kind="reasoning", tokenizer_only=False, out_dir="qwen3"
-        )
-
-        tokenizer_path = Path("qwen3") / "tokenizer-reasoning.json"
-        model_path = Path("qwen3") / "qwen3-0.6B-reasoning.pth"
-        tokenizer = Qwen3Tokenizer(
-            tokenizer_file_path=tokenizer_path,
-            apply_chat_template=True,
-            add_generation_prompt=True,
-            add_thinking=True,
-        )
-
-    else:
-        raise ValueError(f"Invalid choice: WHICH_MODEL={which_model}")
-
-    model = Qwen3ModelBatched(QWEN_CONFIG_06_B)
-    model.load_state_dict(torch.load(model_path, map_location="cpu"))
-    model.to(device)
-
-    if use_compile:
-        torch._dynamo.config.allow_unspec_int_on_nn_module = True
-        model = torch.compile(model)
-
-    return model, tokenizer
-
-
 def evaluate_math500_batched(
     model,
     tokenizer,
@@ -201,7 +154,7 @@ def parse_args():
         "--which_model",
         type=str,
         default="base",
-        choices=["base", "reasoning"],
+        choices=["base", "reasoning", "instruct"],
         help="Model variant to load. Defaults to 'base'.",
     )
     parser.add_argument(
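The net effect is that the batched evaluation script no longer defines its own model setup and instead delegates to the shared helper. A sketch of the resulting call site, assuming get_device from ch02 (as in the script's imports) and eager execution; this is not a verbatim excerpt from the script:

from reasoning_from_scratch.ch02 import get_device
from reasoning_from_scratch.qwen3_batched import get_model

# Obtain the instruct variant through the shared helper; the
# (which_model, device, use_compile) signature matches the diff above.
device = get_device()
model, tokenizer = get_model("instruct", device, use_compile=False)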

reasoning_from_scratch/qwen3_batched.py

Lines changed: 45 additions & 2 deletions
@@ -2,7 +2,9 @@
 # Source for "Build a Reasoning Model (From Scratch)": https://mng.bz/lZ5B
 # Code repository: https://github.com/rasbt/reasoning-from-scratch
 
-from .qwen3 import KVCache
+from .qwen3 import KVCache, download_qwen3_small, Qwen3Tokenizer
+
+from pathlib import Path
 
 import torch
 import torch.nn as nn
@@ -582,4 +584,45 @@ def generate_text_basic_batched_stream_cache_stop(
 
         shrink_kv_cache_inplace(cache, keep_mask_active, model.cfg["n_layers"])
 
-        out = model(next_token_survivors, cache=cache, attn_mask=cur_attn_active)[:, -1]
+        out = model(next_token_survivors, cache=cache, attn_mask=cur_attn_active)[:, -1]
+
+
+def get_model(which_model, device, use_compile):
+    if which_model == "base":
+
+        download_qwen3_small(
+            kind="base", tokenizer_only=False, out_dir="qwen3"
+        )
+
+        tokenizer_path = Path("qwen3") / "tokenizer-base.json"
+        model_path = Path("qwen3") / "qwen3-0.6B-base.pth"
+        tokenizer = Qwen3Tokenizer(tokenizer_file_path=tokenizer_path)
+
+    elif which_model in ("reasoning", "instruct"):
+
+        download_qwen3_small(
+            kind="reasoning", tokenizer_only=False, out_dir="qwen3"
+        )
+
+        tokenizer_path = Path("qwen3") / "tokenizer-reasoning.json"
+        model_path = Path("qwen3") / "qwen3-0.6B-reasoning.pth"
+        tokenizer = Qwen3Tokenizer(
+            tokenizer_file_path=tokenizer_path,
+            apply_chat_template=True,
+            add_generation_prompt=True,
+            add_thinking=which_model == "reasoning",
+        )
+
+    else:
+        raise ValueError(f"Invalid choice: WHICH_MODEL={which_model}")
+
+    model = Qwen3Model(QWEN_CONFIG_06_B)
+    model.load_state_dict(torch.load(model_path))
+
+    model.to(device)
+
+    if use_compile:
+        torch._dynamo.config.allow_unspec_int_on_nn_module = True
+        model = torch.compile(model)
+
+    return model, tokenizer
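For orientation, the dispatch above can be summarized as a mapping from CLI value to checkpoint and tokenizer settings. The table below is illustrative only, not code from the commit, and it assumes the tokenizer's chat-template options default to off for the base variant; the key point is that "instruct" reuses the reasoning checkpoint and differs only in disabling thinking in the chat template:

# Illustrative summary of get_model's dispatch (assumed, not from the commit):
VARIANT_SETTINGS = {
    "base":      {"kind": "base",      "apply_chat_template": False, "add_thinking": False},
    "reasoning": {"kind": "reasoning", "apply_chat_template": True,  "add_thinking": True},
    "instruct":  {"kind": "reasoning", "apply_chat_template": True,  "add_thinking": False},
}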
