From c1d2ed1c132e70d6f14bbc6baa78071692075e62 Mon Sep 17 00:00:00 2001
From: Andrej Karpathy
Date: Mon, 20 Oct 2025 00:05:09 +0000
Subject: [PATCH] use orig_model in sampling, silly of me to miss this

---
 scripts/base_train.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/scripts/base_train.py b/scripts/base_train.py
index 518bd71..9f2cdff 100644
--- a/scripts/base_train.py
+++ b/scripts/base_train.py
@@ -219,7 +219,7 @@ for step in range(num_iterations + 1):
             "My favorite color is",
             "If 5*x + 3 = 13, then x is",
         ]
-        engine = Engine(orig_model, tokenizer)
+        engine = Engine(orig_model, tokenizer) # use orig_model to avoid recompilation
         for prompt in prompts:
             tokens = tokenizer(prompt, prepend="<|bos|>")
             with autocast_ctx: