Add MiniF2F execution case

2024-06-05 11:19:12 -07:00 · 2024-06-05 11:19:12 -07:00 · 61b3a1b3d2
parent a8812c103b
commit 61b3a1b3d2
4 changed files with 18 additions and 4 deletions
--- a/examples_search/Example/lakefile.lean
+++ b/examples_search/Example/lakefile.lean
@ -5,7 +5,7 @@ open Lake DSL
 --   "https://github.com/leanprover-community/aesop.git" @ "v4.8.0-rc1"
 require mathlib from git
-  "https://github.com/leanprover-community/mathlib4"
+  "https://github.com/leanprover-community/mathlib4" @ "v4.8.0-rc1"
 package Example
--- a/examples_search/miniF2F_search.py
+++ b/examples_search/miniF2F_search.py
@ -1,6 +1,6 @@
 #!/usr/bin/env python3
-import subprocess
+import subprocess, json
 from pathlib import Path
 from pantograph.server import Server
 from pantograph.search_llm import LLMAgent
@ -10,14 +10,28 @@ def get_project_and_lean_path():
    p = subprocess.check_output(['lake', 'env', 'printenv', 'LEAN_PATH'], cwd=cwd)
    return cwd, p
 def read_test_data():
    jsonl_path = Path(__file__).parent / 'test.jsonl'
    with open(jsonl_path, 'r') as f:
        return [json.loads(l) for l in list(f)]
 def try_test_data(server, agent, entry) -> bool:
    e = entry["formal_statement"]
    key_theorem, name, e = e.split(' ', 2)
    e, tail = e.split(':=', 1)
    target = "forall " + ','.join(e.rsplit(':', 1))
    print(f"Target: {target}")
    agent = LLMAgent(server)
    return agent.search(server=server, target=target, verbose=True)
 if __name__ == '__main__':
    project_path, lean_path = get_project_and_lean_path()
    print(f"$PWD: {project_path}")
    print(f"$LEAN_PATH: {lean_path}")
    test_data = read_test_data()
    server = Server(imports=["Mathlib"], project_path=project_path, lean_path=lean_path)
    target = "∀ (b h v : ℝ)  (h₀ : 0 < b ∧ 0 < h ∧ 0 < v)  (h₁ : v = 1 / 3 * (b * h))  (h₂ : b = 30)  (h₃ : h = 13 / 2) , v = 65"
    # target = "theorem mathd_algebra_478\n  (b h v : ℝ)\n  (h₀ : 0 < b ∧ 0 < h ∧ 0 < v)\n  (h₁ : v = 1 / 3 * (b * h))\n  (h₂ : b = 30)\n  (h₃ : h = 13 / 2) :\n  v = 65 := sorry"
    agent = LLMAgent(server)
-    flag = agent.search(server=server, target=target, verbose=True)
+    try_test_data(server, agent, test_data[0])
--- a/examples_search/test.jsonl
+++ b/examples_search/test.jsonl
--- a/examples_search/valid.jsonl
+++ b/examples_search/valid.jsonl