Add MiniF2F execution case
This commit is contained in:
parent
a8812c103b
commit
61b3a1b3d2
|
@ -5,7 +5,7 @@ open Lake DSL
|
|||
-- "https://github.com/leanprover-community/aesop.git" @ "v4.8.0-rc1"
|
||||
|
||||
require mathlib from git
|
||||
"https://github.com/leanprover-community/mathlib4"
|
||||
"https://github.com/leanprover-community/mathlib4" @ "v4.8.0-rc1"
|
||||
|
||||
package Example
|
||||
|
||||
|
|
|
@ -1,6 +1,6 @@
|
|||
#!/usr/bin/env python3
|
||||
|
||||
import subprocess
|
||||
import subprocess, json
|
||||
from pathlib import Path
|
||||
from pantograph.server import Server
|
||||
from pantograph.search_llm import LLMAgent
|
||||
|
@ -10,14 +10,28 @@ def get_project_and_lean_path():
|
|||
p = subprocess.check_output(['lake', 'env', 'printenv', 'LEAN_PATH'], cwd=cwd)
|
||||
return cwd, p
|
||||
|
||||
def read_test_data():
|
||||
jsonl_path = Path(__file__).parent / 'test.jsonl'
|
||||
with open(jsonl_path, 'r') as f:
|
||||
return [json.loads(l) for l in list(f)]
|
||||
|
||||
def try_test_data(server, agent, entry) -> bool:
|
||||
e = entry["formal_statement"]
|
||||
key_theorem, name, e = e.split(' ', 2)
|
||||
e, tail = e.split(':=', 1)
|
||||
target = "forall " + ','.join(e.rsplit(':', 1))
|
||||
print(f"Target: {target}")
|
||||
agent = LLMAgent(server)
|
||||
return agent.search(server=server, target=target, verbose=True)
|
||||
|
||||
if __name__ == '__main__':
|
||||
project_path, lean_path = get_project_and_lean_path()
|
||||
print(f"$PWD: {project_path}")
|
||||
print(f"$LEAN_PATH: {lean_path}")
|
||||
|
||||
test_data = read_test_data()
|
||||
server = Server(imports=["Mathlib"], project_path=project_path, lean_path=lean_path)
|
||||
target = "∀ (b h v : ℝ) (h₀ : 0 < b ∧ 0 < h ∧ 0 < v) (h₁ : v = 1 / 3 * (b * h)) (h₂ : b = 30) (h₃ : h = 13 / 2) , v = 65"
|
||||
# target = "theorem mathd_algebra_478\n (b h v : ℝ)\n (h₀ : 0 < b ∧ 0 < h ∧ 0 < v)\n (h₁ : v = 1 / 3 * (b * h))\n (h₂ : b = 30)\n (h₃ : h = 13 / 2) :\n v = 65 := sorry"
|
||||
agent = LLMAgent(server)
|
||||
flag = agent.search(server=server, target=target, verbose=True)
|
||||
|
||||
try_test_data(server, agent, test_data[0])
|
||||
|
|
Loading…
Reference in New Issue