blanchet@41335
|
1 |
(* Title: HOL/Tools/Sledgehammer/sledgehammer_run.ML
|
wenzelm@28477
|
2 |
Author: Fabian Immler, TU Muenchen
|
wenzelm@32996
|
3 |
Author: Makarius
|
blanchet@35967
|
4 |
Author: Jasmin Blanchette, TU Muenchen
|
wenzelm@28477
|
5 |
|
blanchet@38255
|
6 |
Sledgehammer's heart.
|
wenzelm@28477
|
7 |
*)
|
wenzelm@28477
|
8 |
|
blanchet@41335
|
9 |
signature SLEDGEHAMMER_RUN =
sig
  (* Abbreviations for types declared in other modules. *)
  type minimize_command = ATP_Proof_Reconstruct.minimize_command
  type relevance_override = Sledgehammer_Filter.relevance_override
  type mode = Sledgehammer_Provers.mode
  type params = Sledgehammer_Provers.params

  (* Outcome codes; one of them is the string component of the result of
     "run_sledgehammer". *)
  val someN : string
  val noneN : string
  val timeoutN : string
  val unknownN : string

  (* Main entry point. The "int" argument is the subgoal number. The Boolean
     component of the result tells whether the returned outcome code is
     "someN". *)
  val run_sledgehammer :
    params -> mode -> int -> relevance_override ->
    ((string * string list) list -> string -> minimize_command) ->
    Proof.state -> bool * (string * Proof.state)
end;
|
wenzelm@28477
|
25 |
|
blanchet@41335
|
26 |
structure Sledgehammer_Run : SLEDGEHAMMER_RUN =
|
wenzelm@28477
|
27 |
struct
|
wenzelm@28477
|
28 |
|
blanchet@43926
|
29 |
open ATP_Util
|
blanchet@47148
|
30 |
open ATP_Problem_Generate
|
blanchet@47148
|
31 |
open ATP_Proof_Reconstruct
|
blanchet@38257
|
32 |
open Sledgehammer_Util
|
blanchet@49265
|
33 |
open Sledgehammer_Fact
|
blanchet@41335
|
34 |
open Sledgehammer_Provers
|
blanchet@41339
|
35 |
open Sledgehammer_Minimize
|
blanchet@49265
|
36 |
open Sledgehammer_Filter
|
blanchet@40253
|
37 |
|
blanchet@43861
|
38 |
(* Outcome codes used for individual prover runs and for the overall run. *)
val someN = "some"
val noneN = "none"
val timeoutN = "timeout"
val unknownN = "unknown"

(* The outcome codes in decreasing order of precedence, as consulted by
   "max_outcome_code". *)
val ordered_outcome_codes = [someN, unknownN, timeoutN, noneN]

(* Returns the first element of "ordered_outcome_codes" that occurs in "codes".
   If none of them occurs (in particular, if "codes" is empty), the result is
   "unknownN". *)
fun max_outcome_code codes =
  ordered_outcome_codes
  |> find_first (member (op =) codes)
  |> the_default unknownN
|
blanchet@43861
|
53 |
|
blanchet@41456
|
54 |
(* Builds the pair (prover name, description of the run). The description
   mentions the number of facts only if "verbose" is set, then "goal" (when
   there is a single subgoal, i.e., n = 1) or "subgoal i". In blocking mode it
   ends with a period; otherwise it is followed by a newline and the printed
   i-th premise of "goal". *)
fun prover_description ctxt ({verbose, blocking, ...} : params) name num_facts i
                       n goal =
  let
    val fact_part =
      if verbose then
        " with " ^ string_of_int num_facts ^ " fact" ^ plural_s num_facts
      else
        ""
    val goal_part = if n = 1 then "goal" else "subgoal " ^ string_of_int i
    (* The subgoal is printed only in the non-blocking case. *)
    val tail_part =
      if blocking then
        "."
      else
        "\n" ^ Syntax.string_of_term ctxt (Thm.term_of (Thm.cprem_of goal i))
  in (name, fact_part ^ " on " ^ goal_part ^ tail_part) end
|
blanchet@41337
|
64 |
|
blanchet@46577
|
65 |
(* Runs the prover "name" on the given problem and returns an outcome code
   paired with a proof state.

   - In "Auto_Try" mode, the prover runs under "timeout"; if the outcome is
     "someN", the prover's message is attached to the returned state as a
     highlighted goal message.
   - Otherwise, in blocking mode, the prover runs under twice "timeout" and its
     message is printed if the outcome is "someN" or the mode is "Normal".
   - Otherwise, the run is handed over to "Async_Manager.launch" and
     ("unknownN", state) is returned right away. *)
fun launch_prover (params as {debug, verbose, blocking, max_relevant, slice,
                              timeout, expect, ...})
        mode minimize_command only {state, goal, subgoal, subgoal_count, facts}
        name =
  let
    val ctxt = Proof.context_of state
    (* The hard limit is twice the soft timeout. *)
    val hard_timeout = Time.+ (timeout, timeout)
    val start_time = Time.now ()
    val deadline = Time.+ (start_time, hard_timeout)
    val default_limit = default_max_relevant_for_prover ctxt slice name
    val fact_limit = the_default default_limit max_relevant
    (* With "only", all the supplied facts are kept. *)
    val num_facts =
      if only then length facts
      else Integer.min fact_limit (length facts)
    fun desc () =
      prover_description ctxt params name num_facts subgoal subgoal_count goal
    fun is_induction_fact fact =
      snd (snd (fst (untranslated_fact fact))) = Induction
    (* Induction facts are passed on to higher-order ATPs only. *)
    val usable_facts =
      if Sledgehammer_Provers.is_ho_atp ctxt name then facts
      else filter_out is_induction_fact facts
    val problem =
      {state = state, goal = goal, subgoal = subgoal,
       subgoal_count = subgoal_count, facts = take num_facts usable_facts}
    (* Invokes the prover and maps its result to an outcome code and a delayed
       message. *)
    fun really_go () =
      let
        val {outcome, preplay, message, message_tail, ...} =
          get_minimizing_prover ctxt mode name params minimize_command problem
        val code =
          case outcome of
            NONE => someN
          | SOME failure =>
            if failure = ATP_Proof.TimedOut then timeoutN else noneN
      in (code, fn () => message (preplay ()) ^ message_tail) end
    fun go () =
      let
        (* Turns exceptions other than interrupts into an "unknownN" outcome
           with an error message. *)
        fun guarded () =
          really_go ()
          handle ERROR msg => (unknownN, fn () => "Error: " ^ msg ^ "\n")
               | exn =>
                 if Exn.is_interrupt exn then
                   reraise exn
                 else
                   (unknownN,
                    fn () =>
                      "Internal error:\n" ^ ML_Compiler.exn_message exn ^ "\n")
        (* In debug mode, exceptions are not intercepted. *)
        val (outcome_code, message) =
          if debug then really_go () else guarded ()
        (* The "expect" argument is deliberately ignored if the prover is
           missing so that the "Metis_Examples" can be processed on any
           machine. *)
        val outcome_as_expected =
          expect = "" orelse outcome_code = expect orelse
          not (is_prover_installed ctxt name)
        val _ =
          if outcome_as_expected then
            ()
          else
            let
              val complaint = "Unexpected outcome: " ^ quote outcome_code ^ "."
            in
              if blocking then error complaint else warning complaint
            end
      in (outcome_code, message) end
  in
    if mode = Auto_Try then
      let
        val (outcome_code, message) = TimeLimit.timeLimit timeout go ()
        fun hilited_message () =
          Pretty.chunks
            [Pretty.str "",
             Pretty.mark Isabelle_Markup.hilite (Pretty.str (message ()))]
      in
        (outcome_code,
         state |> outcome_code = someN ? Proof.goal_message hilited_message)
      end
    else if blocking then
      let
        val (outcome_code, message) = TimeLimit.timeLimit hard_timeout go ()
        val report =
          if outcome_code = someN orelse mode = Normal then
            quote name ^ ": " ^ message ()
          else
            ""
        val _ =
          List.app Output.urgent_message
                   (Async_Manager.break_into_chunks report)
      in (outcome_code, state) end
    else
      let
        (* The Boolean tells whether the message is to be shown: always in
           verbose mode, otherwise only on success. *)
        fun job () =
          let val (outcome_code, message) = go () in
            (verbose orelse outcome_code = someN, message ())
          end
        val _ =
          Async_Manager.launch das_tool start_time deadline (desc ()) job
      in (unknownN, state) end
  end
|
blanchet@41337
|
151 |
|
blanchet@41483
|
152 |
(* Selects the SMT solver "name" in "ctxt" and returns the solver class of the
   resulting context, rendered as a string. *)
fun class_of_smt_solver ctxt name =
  SMT_Utils.string_of_class
    (SMT_Config.solver_class_of (select_smt_solver name ctxt))
|
blanchet@41483
|
155 |
|
blanchet@43862
|
156 |
(* In "Auto_Try" mode, the default maximum number of relevant facts is divided
   by this number (see "get_facts" inside "run_sledgehammer"). *)
val auto_try_max_relevant_divisor = 2 (* FUDGE *)

(* Runs the provers listed in "params" on subgoal "i" of "state".

   Raises an error if no prover is set or if some prover is not supported. If
   the state has no subgoal, prints "No subgoal!" and returns
   (false, (noneN, state)). Otherwise the result is
   (outcome_code = someN, (outcome_code, state')).

   In blocking mode, the full ATPs are launched first; unless the mode is
   "Auto_Try", the unit-equational ATPs and the SMT solvers follow (subject to
   "maybe"). In non-blocking mode, all three groups are launched in a forked
   future and the result is immediately (false, (unknownN, state')), where
   state' is the state with "SMT_Config.verbose" set to "debug". A
   "TimeLimit.TimeOut" exception yields an "unknownN" outcome. *)
fun run_sledgehammer (params as {debug, verbose, blocking, provers,
                                 relevance_thresholds, max_relevant, slice,
                                 ...})
        mode i (relevance_override as {only, ...}) minimize_command state =
  if null provers then
    error "No prover is set."
  else case subgoal_count state of
    0 => (Output.urgent_message "No subgoal!"; (false, (noneN, state)))
  | n =>
    let
      val _ = Proof.assert_backward state
      (* Progress messages are printed in "Normal" mode only. *)
      val print = if mode = Normal then Output.urgent_message else K ()
      val state =
        state |> Proof.map_context (Config.put SMT_Config.verbose debug)
      val ctxt = Proof.context_of state
      val {facts = chained_ths, goal, ...} = Proof.goal state
      val chained_ths = chained_ths |> normalize_chained_theorems
      val (_, hyp_ts, concl_t) = strip_subgoal ctxt goal i
      val ho_atp = exists (Sledgehammer_Provers.is_ho_atp ctxt) provers
      val facts =
        nearly_all_facts ctxt ho_atp relevance_override chained_ths hyp_ts
                         concl_t
      (* Running provers are killed before a non-blocking launch. *)
      val _ = () |> not blocking ? kill_provers
      val _ = case find_first (not o is_prover_supported ctxt) provers of
                SOME name => error ("No such prover: " ^ name ^ ".")
              | NONE => ()
      val _ = print "Sledgehammering..."
      (* Split the provers into SMT solvers, unit-equational ATPs, and the
         remaining ("full") ATPs. *)
      val (smts, (ueq_atps, full_atps)) =
        provers |> List.partition (is_smt_prover ctxt)
                ||> List.partition (is_unit_equational_atp ctxt)
      (* Obtains the facts, pairs each with its index, translates them using
         "translate", and launches the given provers on the resulting problem.
         In "Auto_Try" and "Try" modes, the provers are run one after the other
         until one of them yields "someN"; otherwise they are all launched
         (via "Par_List.map" in blocking mode) and their outcome codes are
         combined using "max_outcome_code". *)
      fun launch_provers state get_facts translate provers =
        let
          val facts = get_facts ()
          val num_facts = length facts
          val facts = facts ~~ (0 upto num_facts - 1)
                      |> map (translate num_facts)
          val problem =
            {state = state, goal = goal, subgoal = i, subgoal_count = n,
             facts = facts}
          val launch = launch_prover params mode minimize_command only
        in
          if mode = Auto_Try orelse mode = Try then
            (unknownN, state)
            |> fold (fn prover => fn accum as (outcome_code, _) =>
                        if outcome_code = someN then accum
                        else launch problem prover)
                    provers
          else
            provers
            |> (if blocking then Par_List.map else map)
                   (launch problem #> fst)
            |> max_outcome_code |> rpair state
        end
      (* Filters the candidate facts for the given (nonempty) list of provers.
         "label" is the singular name of the prover group; "plural_s" is
         appended to it in the debug message. *)
      fun get_facts label is_appropriate_prop relevance_fudge provers =
        let
          (* Either the user-supplied maximum or the largest default among the
             provers, the latter scaled down in "Auto_Try" mode. *)
          val max_max_relevant =
            case max_relevant of
              SOME n => n
            | NONE =>
              0 |> fold (Integer.max
                         o default_max_relevant_for_prover ctxt slice)
                        provers
                |> mode = Auto_Try
                   ? (fn n => n div auto_try_max_relevant_divisor)
          val is_built_in_const =
            is_built_in_const_for_prover ctxt (hd provers)
        in
          facts
          |> (case is_appropriate_prop of
                SOME is_app => filter (is_app o prop_of o snd)
              | NONE => I)
          |> relevant_facts ctxt relevance_thresholds max_max_relevant
                            is_built_in_const relevance_fudge relevance_override
                            chained_ths hyp_ts concl_t
          |> tap (fn facts =>
                     if debug then
                       label ^ plural_s (length provers) ^ ": " ^
                       (if null facts then
                          "Found no relevant facts."
                        else
                          "Including (up to) " ^ string_of_int (length facts) ^
                          " relevant fact" ^ plural_s (length facts) ^ ":\n" ^
                          (facts |> map (fst o fst) |> space_implode " ") ^ ".")
                       |> print
                     else
                       ())
        end
      (* Launches a group of ATPs, unless the group is empty or the goal does
         not satisfy "is_appropriate_prop"; in those cases "accum" is returned
         unchanged.
         NOTE(review): when provers are launched, "accum" is discarded, so in
         "Normal" mode the final outcome code reflects only the last group
         that was launched -- confirm that this is intended. *)
      fun launch_atps label is_appropriate_prop atps accum =
        if null atps then
          accum
        else if is_some is_appropriate_prop andalso
                not (the is_appropriate_prop concl_t) then
          (if verbose orelse length atps = length provers then
             "Goal outside the scope of " ^
             space_implode " " (serial_commas "and" (map quote atps)) ^ "."
             |> Output.urgent_message
           else
             ();
           accum)
        else
          launch_provers state
              (get_facts label is_appropriate_prop atp_relevance_fudge o K atps)
              (K (Untranslated_Fact o fst)) atps
      (* Launches the SMT solvers, grouped by solver class; all groups share
         the same facts. Like "launch_atps", this discards "accum" when there
         is something to launch. *)
      fun launch_smts accum =
        if null smts then
          accum
        else
          let
            val facts = get_facts "SMT solver" NONE smt_relevance_fudge smts
            val weight = SMT_Weighted_Fact oo weight_smt_fact ctxt
          in
            smts |> map (`(class_of_smt_solver ctxt))
                 |> AList.group (op =)
                 |> map (snd #> launch_provers state (K facts) weight #> fst)
                 |> max_outcome_code |> rpair state
          end
      val launch_full_atps = launch_atps "ATP" NONE full_atps
      (* The label is singular because "get_facts" appends "plural_s" to it;
         a plural label would be printed as "...proverss" for several provers
         and as "...provers" for a single one. *)
      val launch_ueq_atps =
        launch_atps "Unit equational prover" (SOME is_unit_equality) ueq_atps
      (* Used in non-blocking mode: launches all three groups, discarding
         their results. *)
      fun launch_atps_and_smt_solvers () =
        [launch_full_atps, launch_smts, launch_ueq_atps]
        |> Par_List.map (fn f => ignore (f (unknownN, state)))
        handle ERROR msg => (print ("Error: " ^ msg); error msg)
      (* Applies "f" unless the mode is not "Normal" and a proof has already
         been found. *)
      fun maybe f (accum as (outcome_code, _)) =
        accum |> (mode = Normal orelse outcome_code <> someN) ? f
    in
      (unknownN, state)
      |> (if blocking then
            launch_full_atps
            #> mode <> Auto_Try ? (maybe launch_ueq_atps #> maybe launch_smts)
          else
            (fn p => Future.fork (tap launch_atps_and_smt_solvers) |> K p))
      handle TimeLimit.TimeOut =>
             (print "Sledgehammer ran out of time."; (unknownN, state))
    end
    |> `(fn (outcome_code, _) => outcome_code = someN)
|
blanchet@38290
|
294 |
|
wenzelm@28582
|
295 |
end;
|