Spaces:

delta-lab-ai
/

lean-refactor-arena

Running

App Files Files Community

lean-refactor-arena / PyPantograph /src /Test /Integration.lean

mikeljl

use pypantograph for checking submitted statements

0115dcf 6 days ago

raw

history blame contribute delete

18.5 kB

	/- Integration test for the REPL
	-/
	import LSpec
	import Pantograph
	import Repl
	import Test.Common

	namespace Pantograph.Test.Integration
	open Pantograph.Repl

	export Frontend (defaultFileName)

	deriving instance Lean.ToJson for Protocol.EnvInspect
	deriving instance Lean.ToJson for Protocol.EnvAdd
	deriving instance Lean.ToJson for Protocol.ExprEcho
	deriving instance Lean.ToJson for Protocol.OptionsSet
	deriving instance Lean.ToJson for Protocol.OptionsPrint
	deriving instance Lean.ToJson for Protocol.GoalStart
	deriving instance Lean.ToJson for Protocol.GoalPrint
	deriving instance Lean.ToJson for Protocol.GoalTactic
	deriving instance Lean.ToJson for Protocol.FrontendProcess
	deriving instance Lean.ToJson for Protocol.FrontendDataUnit
	deriving instance Lean.ToJson for Protocol.FrontendData
	deriving instance Lean.ToJson for Protocol.FrontendTrack
	deriving instance Lean.ToJson for Protocol.FrontendDistil

	abbrev TestM α := TestT MainM α
	abbrev Test := TestM Unit

	def getFileName : TestM String := do
	return (← read).coreContext.fileName

	def step { α β } [Lean.ToJson α] [Lean.ToJson β] (cmd: String) (payload: α)
	(expected: β) (name? : Option String := .none) : TestM Unit := do
	let payload := Lean.toJson payload
	let name := name?.getD s!"{cmd} {payload.compress}"
	let result ← Repl.execute { cmd, payload }
	checkEq name result.compress (Lean.toJson expected).compress
	def stepFile { α } [Lean.ToJson α] (name : String) (path : String)
	(expected : α) : TestM Unit := do
	let content ← IO.FS.readFile path
	let payload? : Except String Lean.Json := Lean.Json.parse content
	match payload? with
	\| .ok payload =>
	let expected := Lean.toJson expected
	checkEq name payload.compress expected.compress
	\| .error e => fail s!"{name} {e}"

	def test_expr_echo : Test :=
	step "expr.echo"
	({ expr := "λ {α : Sort (u + 1)} => List α", levels? := .some #[`u]}: Protocol.ExprEcho)
	({
	type := { pp? := .some "{α : Type u} → Type u" },
	expr := { pp? := .some "fun {α} => List α" }
	}: Protocol.ExprEchoResult)

	def test_option_modify : Test := do
	let pp? := Option.some "∀ (n : Nat), n + 1 = n.succ"
	let sexp? := Option.some "(:forall n (:c Nat) ((:c Eq) (:c Nat) ((:c HAdd.hAdd) (:c Nat) (:c Nat) (:c Nat) ((:c instHAdd) (:c Nat) (:c instAddNat)) 0 ((:c OfNat.ofNat) (:c Nat) (:lit 1) ((:c instOfNatNat) (:lit 1)))) ((:c Nat.succ) 0)))"
	let module? := Option.some `Init.Data.Nat.Basic
	let options: Protocol.Options := {}
	step "env.inspect" ({ name := `Nat.add_one } : Protocol.EnvInspect)
	({ type := { pp? }, module? }: Protocol.EnvInspectResult)
	step "options.set" ({ printExprAST? := .some true } : Protocol.OptionsSet)
	({ }: Protocol.OptionsSetResult)
	step "env.inspect" ({ name := `Nat.add_one } : Protocol.EnvInspect)
	({ type := { pp?, sexp? }, module? }: Protocol.EnvInspectResult)
	step "options.print" ({} : Protocol.OptionsPrint)
	({ options with printExprAST := true }: Protocol.Options)

	def test_malformed_command : Test := do
	let invalid := "invalid"
	step invalid ({ name := `Nat.add_one }: Protocol.EnvInspect)
	({ error := "command", desc := s!"Unknown command {invalid}" }: Protocol.InteractionError)
	(name? := .some "Invalid Command")
	step "expr.echo" (Lean.Json.mkObj [(invalid, .str "Random garbage data")])
	({ error := "command", desc := s!"Unable to parse json: Pantograph.Protocol.ExprEcho.expr: String expected" }:
	Protocol.InteractionError) (name? := .some "JSON Deserialization")
	def test_tactic_normal : Test := do
	let varX := { name := "_uniq.10".toName, userName := `x, type? := .some { pp? := .some "Prop" }}
	let i1 := 11
	let goal1: Protocol.Goal := {
	name := s!"_uniq.{i1}".toName,
	target := { pp? := .some "∀ (q : Prop), x ∨ q → q ∨ x" },
	vars := #[varX],
	}
	let goal2: Protocol.Goal := {
	name := "_uniq.14".toName,
	target := { pp? := .some "x ∨ y → y ∨ x" },
	vars := #[
	varX,
	{ name := "_uniq.13".toName, userName := `y, type? := .some { pp? := .some "Prop" }}
	],
	}
	step "goal.start" ({ expr := "∀ (p q: Prop), p ∨ q → q ∨ p" }: Protocol.GoalStart)
	({ stateId := 0, root := "_uniq.9".toName }: Protocol.GoalStartResult)
	step "goal.tactic" ({ stateId := 0, tactic? := .some "intro x" }: Protocol.GoalTactic)
	({ nextStateId? := .some 1, goals? := #[goal1], }: Protocol.GoalTacticResult)
	step "goal.print" ({ stateId := 1, parentExprs? := .some true, rootExpr? := .some true }: Protocol.GoalPrint)
	({
	root? := .some { pp? := s!"fun x => ?m.2"},
	parentExprs? := .some [.some { pp? := .some s!"fun x => ?m.2" }],
	}: Protocol.GoalPrintResult)
	step "goal.tactic" ({ stateId := 1, tactic? := .some "intro y" }: Protocol.GoalTactic)
	({ nextStateId? := .some 2, goals? := #[goal2], }: Protocol.GoalTacticResult)
	step "goal.tactic" ({ stateId := 1, tactic? := .some "apply Nat.le_of_succ_le" }: Protocol.GoalTactic)
	({
	messages? := .some #[{
	fileName := ← getFileName,
	kind := .anonymous,
	pos := ⟨0, 0⟩,
	data := "Tactic `apply` failed: could not unify the conclusion of `@Nat.le_of_succ_le`\n ∀ {m : Nat}, Nat.succ ?n ≤ m → ?n ≤ m\nwith the goal\n ∀ (q : Prop), x ∨ q → q ∨ x\n\nNote: The full type of `@Nat.le_of_succ_le` is\n ∀ {n m : Nat}, n.succ ≤ m → n ≤ m\n\nx : Prop\n⊢ ∀ (q : Prop), x ∨ q → q ∨ x",
	}]
	}: Protocol.GoalTacticResult)
	step "goal.tactic" ({ stateId := 0, tactic? := .some "sorry" }: Protocol.GoalTactic)
	({ nextStateId? := .some 3, goals? := .some #[], hasSorry := true }: Protocol.GoalTacticResult)
	example : (1 : Nat) + (2 * 3) = 1 + (4 - 3) + (6 - 4) + 3 := by
	simp
	def test_tactic_timeout : Test := do
	step "goal.start" ({ expr := "(1 : Nat) + (2 * 3) = 1 + (4 - 3) + (6 - 4) + 3" }: Protocol.GoalStart)
	({ stateId := 0, root := "_uniq.326".toName }: Protocol.GoalStartResult)
	-- timeout of 10 milliseconds
	step "options.set" ({ timeout? := .some 10 } : Protocol.OptionsSet)
	({ }: Protocol.OptionsSetResult)
	step "goal.tactic" ({ stateId := 0, expr? := .some "by\nsleep 1000; simp" }: Protocol.GoalTactic)
	(Protocol.InteractionError.errorIO "interrupt")
	-- ensure graceful recovery
	step "options.set" ({ timeout? := .some 0 } : Protocol.OptionsSet)
	({ }: Protocol.OptionsSetResult)
	step "goal.tactic" ({ stateId := 0, tactic? := .some "simp" }: Protocol.GoalTactic)
	({ nextStateId? := .some 1, goals? := .some #[], }: Protocol.GoalTacticResult)

	def test_automatic_mode (automatic: Bool): Test := do
	let varsPQ := #[
	{ name := "_uniq.10".toName, userName := `p, type? := .some { pp? := .some "Prop" }},
	{ name := "_uniq.13".toName, userName := `q, type? := .some { pp? := .some "Prop" }}
	]
	let h' := .mkSimple "h✝"
	let goal1: Protocol.Goal := {
	name := "_uniq.17".toName,
	target := { pp? := .some "q ∨ p" },
	vars := varsPQ ++ #[
	{ name := "_uniq.16".toName, userName := `h, type? := .some { pp? := .some "p ∨ q" }}
	],
	}
	let goal2l: Protocol.Goal := {
	name := "_uniq.57".toName,
	userName? := `inl,
	target := { pp? := .some "q ∨ p" },
	vars := varsPQ ++ #[
	{ name := "_uniq.45".toName, userName := h', type? := .some { pp? := .some "p" }, isInaccessible := true}
	],
	}
	let goal2r: Protocol.Goal := {
	name := "_uniq.70".toName,
	userName? := `inr,
	target := { pp? := .some "q ∨ p" },
	vars := varsPQ ++ #[
	{ name := "_uniq.58".toName, userName := h', type? := .some { pp? := .some "q" }, isInaccessible := true}
	],
	}
	let goal3l: Protocol.Goal := {
	name := "_uniq.76".toName,
	userName? := `inl.h,
	target := { pp? := .some "p" },
	vars := varsPQ ++ #[
	{ name := "_uniq.45".toName, userName := h', type? := .some { pp? := .some "p" }, isInaccessible := true}
	],
	}
	step "options.set" ({automaticMode? := .some automatic}: Protocol.OptionsSet)
	({}: Protocol.OptionsSetResult)
	step "goal.start" ({ expr := "∀ (p q: Prop), p ∨ q → q ∨ p"} : Protocol.GoalStart)
	({ stateId := 0, root := "_uniq.9".toName }: Protocol.GoalStartResult)
	step "goal.tactic" ({ stateId := 0, tactic? := .some "intro p q h" }: Protocol.GoalTactic)
	({ nextStateId? := .some 1, goals? := #[goal1], }: Protocol.GoalTacticResult)
	step "goal.tactic" ({ stateId := 1, tactic? := .some "cases h" }: Protocol.GoalTactic)
	({ nextStateId? := .some 2, goals? := #[goal2l, goal2r], }: Protocol.GoalTacticResult)
	let goals? := if automatic then #[goal3l, goal2r] else #[goal3l]
	step "goal.tactic" ({ stateId := 2, tactic? := .some "apply Or.inr" }: Protocol.GoalTactic)
	({ nextStateId? := .some 3, goals?, }: Protocol.GoalTacticResult)

	def test_conv_calc : Test := do
	step "options.set" ({automaticMode? := .some false}: Protocol.OptionsSet)
	({}: Protocol.OptionsSetResult)
	step "goal.start" ({ expr := "∀ (a b: Nat), (b = 2) -> 1 + a + 1 = a + b"} : Protocol.GoalStart)
	({ stateId := 0, root := "_uniq.152".toName }: Protocol.GoalStartResult)
	let vars := #[
	{ name := "_uniq.153".toName, userName := `a, type? := .some { pp? := .some "Nat" }},
	{ name := "_uniq.156".toName, userName := `b, type? := .some { pp? := .some "Nat" }},
	{ name := "_uniq.159".toName, userName := `h, type? := .some { pp? := .some "b = 2" }},
	]
	let goal : Protocol.Goal := {
	vars,
	name := "_uniq.160".toName,
	target := { pp? := "1 + a + 1 = a + b" },
	}
	step "goal.tactic" ({ stateId := 0, tactic? := .some "intro a b h" }: Protocol.GoalTactic)
	({ nextStateId? := .some 1, goals? := #[goal], }: Protocol.GoalTacticResult)
	step "goal.tactic" ({ stateId := 1, mode? := .some "calc" }: Protocol.GoalTactic)
	({ nextStateId? := .some 2, goals? := #[{ goal with fragment := .calc }], }: Protocol.GoalTacticResult)
	let goalCalc : Protocol.Goal := {
	vars,
	name := "_uniq.342".toName,
	userName? := .some `calc,
	target := { pp? := "1 + a + 1 = a + 1 + 1" },
	}
	let goalMain : Protocol.Goal := {
	vars,
	name := "_uniq.356".toName,
	fragment := .calc,
	target := { pp? := "a + 1 + 1 = a + b" },
	}
	step "goal.tactic" ({ stateId := 2, tactic? := .some "1 + a + 1 = a + 1 + 1" }: Protocol.GoalTactic)
	({ nextStateId? := .some 3, goals? := #[goalCalc, goalMain], }: Protocol.GoalTacticResult)
	let goalConv : Protocol.Goal := {
	goalCalc with
	fragment := .conv,
	userName? := .none,
	name := "_uniq.409".toName,
	}
	step "goal.tactic" ({ stateId := 3, mode? := .some "conv" }: Protocol.GoalTactic)
	({ nextStateId? := .some 4, goals? := #[goalConv], }: Protocol.GoalTacticResult)

	def test_env_add_inspect : Test := do
	let name1 := `Pantograph.mystery
	let name2 := `Pantograph.mystery2
	let name3 := `Pantograph.mystery3
	step "env.add"
	({
	name := name1,
	value := "λ (a b: Prop) => Or a b",
	isTheorem := false
	}: Protocol.EnvAdd)
	({}: Protocol.EnvAddResult)
	step "env.inspect" ({name := name1, value? := .some true} : Protocol.EnvInspect)
	({
	value? := .some { pp? := .some "fun a b => a ∨ b" },
	type := { pp? := .some "Prop → Prop → Prop" },
	}: Protocol.EnvInspectResult)
	step "env.add"
	({
	name := name2,
	type? := "Nat → Int",
	value := "λ (a: Nat) => a + 1",
	isTheorem := false
	}: Protocol.EnvAdd)
	({}: Protocol.EnvAddResult)
	step "env.inspect" ({name := name2, value? := .some true} : Protocol.EnvInspect)
	({
	value? := .some { pp? := .some "fun a => ↑a + 1" },
	type := { pp? := .some "Nat → Int" },
	}: Protocol.EnvInspectResult)
	step "env.add"
	({
	name := name3,
	levels? := .some #[`u],
	type? := "(α : Type u) → α → (α × α)",
	value := "λ (α : Type u) (x : α) => (x, x)",
	isTheorem := false
	}: Protocol.EnvAdd)
	({}: Protocol.EnvAddResult)
	step "env.inspect" ({name := name3} : Protocol.EnvInspect)
	({
	type := { pp? := .some "(α : Type u) → α → α × α" },
	}: Protocol.EnvInspectResult)

	example : ∀ (p: Prop), p → p := by
	intro p h
	exact h

	def test_frontend_process_invocations : Test := do
	let file := "example : ∀ (p q: Prop), p → p ∨ q := by\n intro p q h\n exact Or.inl h"
	let goal1 := "p q : Prop\nh : p\n⊢ p ∨ q"
	IO.FS.withTempDir λ tempdir => do
	let filename := s!"{tempdir}/invocations.jsonl"
	step "frontend.process"
	({
	file? := .some file,
	invocations? := .some filename,
	}: Protocol.FrontendProcess)
	({
	units := [{
	boundary := (0, file.utf8ByteSize),
	nInvocations? := .some 2,
	}],
	}: Protocol.FrontendProcessResult)
	stepFile (α := Protocol.FrontendData) "invocations" filename
	{ units := [{
	invocations? := .some [
	{
	goalBefore := "⊢ ∀ (p q : Prop), p → p ∨ q",
	goalAfter := goal1,
	tactic := "intro p q h",
	usedConstants := #[],
	},
	{
	goalBefore := goal1 ,
	goalAfter := "",
	tactic := "exact Or.inl h",
	usedConstants := #[`Or.inl],
	},
	]
	} ] }

	def test_frontend_process_import_open : Test := do
	let header := "import Init\nopen Nat\nuniverse u"
	let goal1: Protocol.Goal := {
	name := "_uniq.64".toName,
	target := { pp? := .some "n + 1 = n.succ" },
	vars := #[{ name := "_uniq.63".toName, userName := `n, type? := .some { pp? := .some "Nat" }}],
	}
	step "frontend.process"
	({
	file? := .some header,
	readHeader := true,
	inheritEnv := true,
	}: Protocol.FrontendProcess)
	({
	units := [
	{ boundary := (12, 21) },
	{ boundary := (21, header.utf8ByteSize) },
	],
	}: Protocol.FrontendProcessResult)
	step "goal.start" ({ expr := "∀ (n : Nat), n + 1 = Nat.succ n"} : Protocol.GoalStart)
	({ stateId := 0, root := "_uniq.62".toName }: Protocol.GoalStartResult)
	step "goal.tactic" ({ stateId := 0, tactic? := .some "intro n" }: Protocol.GoalTactic)
	({ nextStateId? := .some 1, goals? := #[goal1], }: Protocol.GoalTacticResult)
	step "goal.tactic" ({ stateId := 1, tactic? := .some "apply add_one" }: Protocol.GoalTactic)
	({ nextStateId? := .some 2, goals? := .some #[], }: Protocol.GoalTacticResult)
	step "goal.start" ({ expr := "∀ (x : Sort u), Sort (u + 1)"} : Protocol.GoalStart)
	({ stateId := 3, root := "_uniq.5".toName }: Protocol.GoalStartResult)

	def test_frontend_track : Test := do
	step "frontend.track"
	({
	src := "def f : Nat := sorry",
	dst := "def f : Nat := false",
	}: Protocol.FrontendTrack)
	({
	srcMessages := #[
	{
	fileName := defaultFileName,
	kind := `hasSorry,
	pos := ⟨1, 4⟩,
	endPos := .some ⟨1, 5⟩,
	severity := .warning,
	data := "declaration uses 'sorry'"
	}
	],
	dstMessages := #[
	{
	fileName := defaultFileName,
	kind := .anonymous,
	pos := ⟨1, 15⟩,
	endPos := .some ⟨1, 20⟩,
	severity := .error,
	data := "Type mismatch\n false\nhas type\n Bool\nbut is expected to have type\n Nat"
	},
	],
	} : Protocol.FrontendTrackResult)

	def test_frontend_distil_simple : Test := do
	let file := "theorem mystery (p: Prop) : p → p := sorry"
	let goal1: Protocol.Goal := {
	name := "_uniq.3".toName,
	target := { pp? := .some "∀ (p : Prop), p → p" },
	}
	step "frontend.distil"
	({
	file,
	binderName? := `x,
	}: Protocol.FrontendDistil)
	({
	targets := [{
	stateId := 0,
	goals := #[goal1],
	}],
	} : Protocol.FrontendDistilResult)

	example : 1 + 2 = 3 := rfl
	example (p: Prop): p → p := by simp

	def test_frontend_distil_multiple : Test := do
	let solved := "theorem solved : 1 + 2 = 3 := rfl\n"
	let withSorry := "theorem mystery (p: Prop): p → p := sorry"
	let file := s!"{solved}{withSorry}"
	let goal1: Protocol.Goal := {
	name := "_uniq.190".toName,
	target := { pp? := .some "p → p" },
	vars := #[{ name := "_uniq.189".toName, userName := `p, type? := .some { pp? := .some "Prop" }}],
	}
	step "frontend.distil"
	({
	file,
	ignoreValues := false,
	}: Protocol.FrontendDistil)
	({
	targets := [{
	stateId := 0,
	goals := #[goal1],
	}],
	}: Protocol.FrontendDistilResult)

	/-- Ensure there cannot be circular references -/
	def test_frontend_distil_circular : Test := do
	let withSorry := "theorem mystery : 1 + 2 = 2 + 3 := sorry"
	let goal1: Protocol.Goal := {
	name := "_uniq.1".toName,
	target := { pp? := .some "1 + 2 = 2 + 3" },
	vars := #[],
	}
	step "frontend.distil"
	({
	file := withSorry,
	}: Protocol.FrontendDistil)
	({
	targets := [{
	stateId := 0,
	goals := #[goal1],
	}],
	} : Protocol.FrontendDistilResult)
	step "goal.tactic" ({ stateId := 0, tactic? := .some "exact?" }: Protocol.GoalTactic)
	({
	messages? := .some #[{
	fileName := ← getFileName,
	kind := .anonymous,
	pos := ⟨0, 0⟩,
	data := "`exact?` could not close the goal. Try `apply?` to see partial suggestions."
	}]
	} : Protocol.GoalTacticResult)


	def runTestSuite (env : Lean.Environment) (steps : Test): IO LSpec.TestSeq := do
	-- Setup the environment for execution
	let coreContext ← createCoreContext #[]
	let mainM : MainM LSpec.TestSeq := runTest steps
	mainM.run { coreContext } \|>.run' { env }

	def suite (env : Lean.Environment): List (String × IO LSpec.TestSeq) :=
	let tests := [
	("expr.echo", test_expr_echo),
	("options.set options.print", test_option_modify),
	("Malformed command", test_malformed_command),
	("goal.tactic normal", test_tactic_normal),
	("goal.tactic Timeout", test_tactic_timeout),
	("Manual Mode", test_automatic_mode false),
	("Automatic Mode", test_automatic_mode true),
	("goal.tactic conv calc", test_conv_calc),
	("env.add env.inspect", test_env_add_inspect),

	("frontend.process invocations", test_frontend_process_invocations),
	("frontend.process import", test_frontend_process_import_open),
	("frontend.track", test_frontend_track),
	("frontend.distil simple", test_frontend_distil_simple),
	("frontend.distil multiple", test_frontend_distil_multiple),
	("frontend.distil circular", test_frontend_distil_circular),
	]
	tests.map (fun (name, test) => (name, runTestSuite env test))