LEAN-Eval/local_runner_test.py at main · ZJUVAI/LEAN-Eval · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
# In your main script (e.g. run_local_eval.py)
from LeanEval.runner.local_runner import LocalHuggingFaceRunner
from LeanEval.runner.local_runner_search import LocalSearchRunner
from pathlib import Path
from LeanEval.utils import process_dataset
import accelerate

def main():
    """Build a ``LocalHuggingFaceRunner`` with fixed settings and run it.

    Takes no arguments. The model id, dataset path, output directory and
    generation settings are hard-coded below; edit them in place to change
    the evaluation. Returns ``None``.
    """
    # Optional preprocessing step, currently disabled:
    # download_path = "./data/downloaded/DeepSeek-Prover-V1.5/datasets/minif2f.jsonl"
    # output_json_path = "./data/json/minilean.json"
    # process_dataset.process_jsonl_dataset(download_path=download_path,ouput_json_path=output_json_path)
    # NOTE(review): the disabled snippet writes to minilean.json, while the
    # runner below reads minif2f.json -- confirm which file is intended.
    runner_settings = dict(
        model_id="deepseek-ai/DeepSeek-Prover-V2-7B",
        dataset_path="./data/json/minif2f.json",
        output_dir_base="./outputs_runner_test",
        per_device_batch_size=1,
        max_new_tokens=512,
        mixed_precision='bf16',  # or 'fp16'
        num_proof_rounds=2,
    )
    LocalHuggingFaceRunner(**runner_settings).run()

# --- How to run this script ---
def run_search_evaluation():
    """Example function that instantiates and runs ``LocalSearchRunner``.

    Takes no arguments. A single few-shot (prompt, answer) pair is built
    inline and handed to the runner as ``tactic_shots`` together with the
    hard-coded model, dataset and search settings. Returns ``None``.
    """
    # Few-shot example tailored to the tactic-generation task: the prompt
    # shows a partial proof plus its goals, the answer is one tactic.
    example_prompt = (
        "Given the following partial proof and the current goals, what is the next single tactic to apply?\n\n"
        "### Current Proof State:\n"
        "```lean\nimport Mathlib.Tactic\n\ntheorem Nat.add_comm (n m : Nat) : n + m = m + n := by\n```\n\n"
        "### Current Goals from Lean InfoView:\n"
        "```\n- n m : ℕ ⊢ n + m = m + n\n```\n\n"
        "Your response must be the next single tactic."
    )
    example_answer = "```lean\ninduction m\n```"
    tactic_shots = [(example_prompt, example_answer)]

    search_settings = dict(
        model_id="deepseek-ai/DeepSeek-Prover-V2-7B",
        dataset_path="./data/json/minilean.json",
        output_dir_base="./outputs_runner_test",
        tactic_shots=tactic_shots,
        bfs_degree=5,
        bfs_timeout=1200,
        mixed_precision='bf16',  # or 'fp16'
    )
    LocalSearchRunner(**search_settings).run()


if __name__ == "__main__":
    # Launch with `accelerate launch <your_script_name>.py`.
    # Only run_search_evaluation() is invoked here; main() is defined in this
    # file but is not called.
    run_search_evaluation()