Skip to content

Commit 30ae290

Browse files
committed
Use HF hub checkpoint rather than local checkpoint as the default trained induction model.
1 parent f63230f commit 30ae290

File tree

4 files changed

+5
-6
lines changed

4 files changed

+5
-6
lines changed

README.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -149,7 +149,7 @@ python wandering_light/training/rl_grpo.py --batch-size 32 --model-name $SFT_OUT
149149
### Evaluate local trained LLM
150150
Assuming you have a checkpoint like the one shown below.
151151
```bash
152-
python wandering_light/evals/run_evaluation.py --budget=1 --eval_file=wandering_light/evals/data/random_inputs_500.py --solver_names=[trained_local] --budget 1 --model-name checkpoints/saved/rl/long_sft_opt_125m_s35k_no_len/
152+
python wandering_light/evals/run_evaluation.py --budget=1 --eval_file=wandering_light/evals/data/random_inputs_500.py --solver_names=[trained_local] --budget 1 --model-name abhishekraok/induction-basicfns-opt125m-longsft
153153
```
154154

155155
### Evaluation Dashboard
@@ -164,5 +164,5 @@ First finetune it using SFT, using the `--task proposer` flag. Then evaluate it.
164164

165165
### Evaluate proposer
166166
```bash
167-
python -m wandering_light.evals.evaluate_proposer --model checkpoints/saved/sft/proposer_opt_125m_2k --solver-model checkpoints/saved/rl/long_sft_opt_125m_s35k_no_len/
167+
python -m wandering_light.evals.evaluate_proposer --model checkpoints/saved/sft/proposer_opt_125m_2k --solver-model abhishekraok/induction-basicfns-opt125m-longsft
168168
```

wandering_light/constants.py

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -6,8 +6,7 @@
66

77
# Evaluation file path
88
DEFAULT_EVAL_FILE = "wandering_light/evals/data/random_inputs.py"
9-
# TODO Upload this to the internet
10-
DEFAULT_SOLVER_CHECKPOINT = "checkpoints/saved/rl/long_sft_opt_125m_s35k_no_len"
9+
DEFAULT_SOLVER_CHECKPOINT = "abhishekraok/induction-basicfns-opt125m-longsft"
1110

1211

1312
class Task(StrEnum):

wandering_light/web_ui/backend/main.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -81,7 +81,7 @@ class ExecutionResult(BaseModel):
8181
class SolverRequest(BaseModel):
8282
input_list: TypedListCreate
8383
output_list: TypedListCreate
84-
checkpoint_path: str = "checkpoints/saved/rl/long_sft_opt_125m_s35k_no_len/"
84+
checkpoint_path: str = "abhishekraok/induction-basicfns-opt125m-longsft"
8585

8686

8787
class SolverResponse(BaseModel):

wandering_light/web_ui/frontend/src/components/SolverPlayground.tsx

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -40,7 +40,7 @@ const SolverPlayground: React.FC = () => {
4040
const [inputItems, setInputItems] = useState('[1, 2, 3]');
4141
const [outputType, setOutputType] = useState('builtins.int');
4242
const [outputItems, setOutputItems] = useState('[2, 4, 6]');
43-
const [checkpointPath, setCheckpointPath] = useState('../../../checkpoints/saved/rl/long_sft_opt_125m_s35k_no_len/');
43+
const [checkpointPath, setCheckpointPath] = useState('abhishekraok/induction-basicfns-opt125m-longsft');
4444
const [solverResult, setSolverResult] = useState<SolverResponse | null>(null);
4545
const [isLoading, setIsLoading] = useState(false);
4646
const toast = useToast();

0 commit comments

Comments
 (0)