src/HOL/Mirabelle/Tools/mirabelle_sledgehammer.ML
author blanchet
Fri, 20 Jul 2012 22:19:45 +0200
changeset 49396 1b7d798460bb
parent 49336 c552d7f1720b
child 49414 4bacc8983b3d
permissions -rw-r--r--
renamed ML structures
wenzelm@48718
     1
(*  Title:      HOL/Mirabelle/Tools/mirabelle_sledgehammer.ML
wenzelm@32564
     2
    Author:     Jasmin Blanchette and Sascha Boehme and Tobias Nipkow, TU Munich
boehmes@32385
     3
*)
boehmes@32385
     4
boehmes@32385
     5
structure Mirabelle_Sledgehammer : MIRABELLE_ACTION =
boehmes@32385
     6
struct
boehmes@32385
     7
sultana@48351
     8
(*To facilitate synching the description of Mirabelle Sledgehammer parameters
sultana@48351
     9
 (in ../lib/Tools/mirabelle) with the parameters actually used by this
sultana@48351
    10
 interface, the former extracts PARAMETER and DESCRIPTION from code below which
sultana@48351
    11
 has this pattern (provided it appears in a single line):
sultana@48351
    12
   val .*K = "PARAMETER" (*DESCRIPTION*)
sultana@48351
    13
*)
sultana@48351
    14
(*NOTE: descriptions mention parameters (particularly NAME) without a defined range.*)
sultana@48351
    15
val proverK = "prover" (*=NAME: name of the external prover to call*)
sultana@48351
    16
val prover_timeoutK = "prover_timeout" (*=TIME: timeout for invoked ATP (seconds of process time)*)
sultana@48351
    17
val keepK = "keep" (*=PATH: path where to keep temporary files created by sledgehammer*)
sultana@48351
    18
val minimizeK = "minimize" (*: enable minimization of theorem set found by sledgehammer*)
sultana@48351
    19
                           (*refers to minimization attempted by Mirabelle*)
sultana@48351
    20
val minimize_timeoutK = "minimize_timeout" (*=TIME: timeout for each minimization step (seconds of process time)*)
sultana@48351
    21
sultana@48351
    22
val reconstructorK = "reconstructor" (*=NAME: how to reconstruct proofs (ie. using metis/smt)*)
sultana@48351
    23
val metis_ftK = "metis_ft" (*: apply metis with fully-typed encoding to the theorems found by sledgehammer*)
sultana@48351
    24
blanchet@49308
    25
val max_factsK = "max_facts" (*=NUM: max. relevant clauses to use*)
sultana@48351
    26
val max_relevantK = "max_relevant" (*=NUM: max. relevant clauses to use*)
sultana@48351
    27
val max_callsK = "max_calls" (*=NUM: max. no. of calls to sledgehammer*)
sultana@48351
    28
val preplay_timeoutK = "preplay_timeout" (*=TIME: timeout for finding reconstructed proof*)
sultana@48351
    29
val sh_minimizeK = "sh_minimize" (*: instruct sledgehammer to run its minimizer*)
sultana@48351
    30
sultana@48351
    31
val check_trivialK = "check_trivial" (*: check if goals are "trivial" (false by default)*)
sultana@48351
    32
val type_encK = "type_enc" (*=STRING: type encoding scheme*)
sultana@48351
    33
val lam_transK = "lam_trans" (*=STRING: lambda translation scheme*)
sultana@48351
    34
val strictK = "strict" (*=BOOL: run in strict mode*)
sultana@48351
    35
val sliceK = "slice" (*=BOOL: allow sledgehammer-level strategy-scheduling*)
sultana@48351
    36
val uncurried_aliasesK = "uncurried_aliases" (*=SMART_BOOL: use fresh function names to alias curried applications*)
sultana@48351
    37
val e_selection_heuristicK = "e_selection_heuristic" (*: FIXME*)
sultana@48351
    38
val term_orderK = "term_order" (*: FIXME*)
sultana@48351
    39
val force_sosK = "force_sos" (*: use SOS*)
sultana@48351
    40
val max_new_mono_instancesK = "max_new_mono_instances" (*=NUM: max. new monomorphic instances*)
sultana@48351
    41
val max_mono_itersK = "max_mono_iters" (*=NUM: max. iterations of monomorphiser*)
blanchet@45305
    42
boehmes@32521
    43
(*prefix for log lines about a sledgehammer call, tagged with the numeric id*)
fun sh_tag id = String.concat ["#", string_of_int id, " sledgehammer: "]
boehmes@32525
    44
(*prefix for log lines about a minimization step, tagged with the numeric id*)
fun minimize_tag id = String.concat ["#", string_of_int id, " minimize (sledgehammer): "]
blanchet@40915
    45
(*prefix for log lines about a reconstructor call; the reconstructor name is
  read from the given reference at the time the tag is built*)
fun reconstructor_tag reconstructor id =
  String.concat ["#", string_of_int id, " ", ! reconstructor, " (sledgehammer): "]
boehmes@32521
    47
boehmes@32525
    48
val separator = "-----"
boehmes@32525
    49
sultana@48352
    50
(*FIXME sensible to have Mirabelle-level Sledgehammer defaults?*)
sultana@48352
    51
(*defaults used in this Mirabelle action*)
sultana@47696
    52
val preplay_timeout_default = "4"
sultana@48352
    53
val lam_trans_default = "smart"
sultana@48352
    54
val uncurried_aliases_default = "smart"
sultana@48352
    55
val type_enc_default = "smart"
sultana@48352
    56
val strict_default = "false"
blanchet@49308
    57
val max_facts_default = "smart"
sultana@48352
    58
val slice_default = "true"
sultana@48352
    59
val max_calls_default = "10000000"
sultana@48352
    60
val trivial_default = "false"
sultana@48352
    61
val minimize_timeout_default = 5
sultana@47697
    62
sultana@47697
    63
(*If a key is present in args then augment a list with its pair*)
sultana@47697
    64
(*This is used to avoid fixing default values at the Mirabelle level, and
sultana@47697
    65
  instead use the default values of the tool (Sledgehammer in this case).*)
sultana@47697
    66
(*Prepend (label, value) to list when key is bound to value in the association
  list args; otherwise return list unchanged.*)
fun available_parameter args key label list =
  (case AList.lookup (op =) args key of
    SOME value => (label, value) :: list
  | NONE => list)
sultana@47697
    70
boehmes@32521
    71
nipkow@32549
    72
(*Counters accumulated over sledgehammer calls.
  The time_* fields are sums; the report divides them by 1000.0 before
  printing, so they are presumably in milliseconds.*)
datatype sh_data =
  ShData of
   {calls: int,              (*all calls*)
    success: int,            (*successful calls*)
    nontriv_calls: int,      (*calls on nontrivial goals*)
    nontriv_success: int,    (*successful calls on nontrivial goals*)
    lemmas: int,             (*total number of lemmas*)
    max_lems: int,           (*maximum number of lemmas seen*)
    time_isa: int,           (*time reported as "Isabelle"*)
    time_prover: int,        (*ATP time of successful calls*)
    time_prover_fail: int}   (*ATP time of failed calls*)
boehmes@32521
    82
blanchet@40915
    83
(*Counters accumulated over reconstructor calls.*)
datatype re_data =
  ReData of
   {calls: int,
    success: int,
    nontriv_calls: int,
    nontriv_success: int,
    proofs: int,
    time: int,                       (*summed time of successful calls*)
    timeout: int,                    (*number of timeouts*)
    lemmas: int * int * int,         (*sum, sum of squares, maximum (see inc_max)*)
    posns: (Position.T * bool) list} (*positions; the flag is printed as "[T]"*)
boehmes@32521
    94
nipkow@32571
    95
(*Counters for minimization: number of successes and the summed
  after/before ratios.*)
datatype min_data =
  MinData of
   {succs: int,
    ab_ratios: int}
boehmes@32521
    99
nipkow@32810
   100
(*build an sh_data record from its 9-tuple form (inverse of tuple_of_sh_data)*)
fun make_sh_data (c, s, nc, ns, l, ml, t_isa, t_prover, t_prover_fail) =
  ShData
   {calls = c,
    success = s,
    nontriv_calls = nc,
    nontriv_success = ns,
    lemmas = l,
    max_lems = ml,
    time_isa = t_isa,
    time_prover = t_prover,
    time_prover_fail = t_prover_fail}
boehmes@32521
   107
blanchet@35866
   108
(*build a min_data record from its pair form*)
fun make_min_data (n_succs, ratios) =
  MinData {succs = n_succs, ab_ratios = ratios}
nipkow@32571
   110
blanchet@40915
   111
(*build an re_data record from its 9-tuple form (inverse of tuple_of_re_data)*)
fun make_re_data (c, s, nc, ns, p, tm, tmo, ls, ps) =
  ReData
   {calls = c,
    success = s,
    nontriv_calls = nc,
    nontriv_success = ns,
    proofs = p,
    time = tm,
    timeout = tmo,
    lemmas = ls,
    posns = ps}
boehmes@32521
   116
blanchet@39583
   117
val empty_sh_data = make_sh_data (0, 0, 0, 0, 0, 0, 0, 0, 0)
blanchet@35871
   118
val empty_min_data = make_min_data (0, 0)
blanchet@40915
   119
val empty_re_data = make_re_data (0, 0, 0, 0, 0, 0, 0, (0,0,0), [])
boehmes@32521
   120
blanchet@39583
   121
(*flatten an sh_data record into the 9-tuple expected by make_sh_data*)
fun tuple_of_sh_data (ShData r) =
  (#calls r, #success r, #nontriv_calls r, #nontriv_success r, #lemmas r,
   #max_lems r, #time_isa r, #time_prover r, #time_prover_fail r)
boehmes@32521
   125
blanchet@35866
   126
(*flatten a min_data record into the pair expected by make_min_data*)
fun tuple_of_min_data (MinData r) = (#succs r, #ab_ratios r)
nipkow@32533
   127
blanchet@40915
   128
(*flatten an re_data record into the 9-tuple expected by make_re_data*)
fun tuple_of_re_data (ReData r) =
  (#calls r, #success r, #nontriv_calls r, #nontriv_success r, #proofs r,
   #time r, #timeout r, #lemmas r, #posns r)
nipkow@32571
   131
boehmes@34033
   132
blanchet@40915
   133
(*selects which of the four reconstructor statistics records is updated
  (see map_re_data); FT = fully-typed*)
datatype reconstructor_mode =
    Unminimized
  | Minimized
  | UnminimizedFT
  | MinimizedFT
boehmes@34033
   135
boehmes@34033
   136
(*all statistics collected for one action id*)
datatype data =
  Data of
   {sh: sh_data,
    min: min_data,
    re_u: re_data,    (*reconstructor with unminimized set of lemmas*)
    re_m: re_data,    (*reconstructor with minimized set of lemmas*)
    re_uft: re_data,  (*reconstructor with unminimized set of lemmas and fully-typed*)
    re_mft: re_data,  (*reconstructor with minimized set of lemmas and fully-typed*)
    mini: bool}       (*with minimization*)
boehmes@34033
   145
blanchet@40915
   146
(*build a data record from its 7-tuple form*)
fun make_data (sh_stats, min_stats, u, m, uft, mft, with_mini) =
  Data
   {sh = sh_stats,
    min = min_stats,
    re_u = u,
    re_m = m,
    re_uft = uft,
    re_mft = mft,
    mini = with_mini}
boehmes@34033
   149
boehmes@34033
   150
val empty_data = make_data (empty_sh_data, empty_min_data,
blanchet@40915
   151
  empty_re_data, empty_re_data, empty_re_data, empty_re_data, false)
boehmes@34033
   152
blanchet@40915
   153
(*apply f to the tuple form of the sledgehammer statistics; all other
  components are carried over unchanged*)
fun map_sh_data f (Data {sh, min, re_u, re_m, re_uft, re_mft, mini}) =
  make_data
    (sh |> tuple_of_sh_data |> f |> make_sh_data, min, re_u, re_m, re_uft, re_mft, mini)
boehmes@34033
   156
blanchet@40915
   157
(*apply f to the tuple form of the minimization statistics; all other
  components are carried over unchanged*)
fun map_min_data f (Data {sh, min, re_u, re_m, re_uft, re_mft, mini}) =
  make_data
    (sh, min |> tuple_of_min_data |> f |> make_min_data, re_u, re_m, re_uft, re_mft, mini)
boehmes@34033
   160
blanchet@40915
   161
(*apply f to the tuple form of the reconstructor statistics selected by
  mode m; the three other reconstructor records stay as they are*)
fun map_re_data f m (Data {sh, min, re_u, re_m, re_uft, re_mft, mini}) =
  let
    fun upd re = make_re_data (f (tuple_of_re_data re))
    val (u, mn, uft, mft) =
      (case m of
        Unminimized => (upd re_u, re_m, re_uft, re_mft)
      | Minimized => (re_u, upd re_m, re_uft, re_mft)
      | UnminimizedFT => (re_u, re_m, upd re_uft, re_mft)
      | MinimizedFT => (re_u, re_m, re_uft, upd re_mft))
  in make_data (sh, min, u, mn, uft, mft, mini) end
boehmes@34033
   173
blanchet@40915
   174
(*replace the "with minimization" flag, keeping all statistics*)
fun set_mini mini (Data {sh, min, re_u, re_m, re_uft, re_mft, mini = _}) =
  Data {sh = sh, min = min, re_u = re_u, re_m = re_m, re_uft = re_uft,
    re_mft = re_mft, mini = mini}
nipkow@32990
   176
nipkow@32990
   177
(*fold n into a (sum, sum of squares, maximum) triple*)
fun inc_max (n: int) (sum, sum_of_squares, maximum) =
  let
    val sum' = sum + n
    val sum_of_squares' = sum_of_squares + n * n
    val maximum' = Int.max (maximum, n)
  in (sum', sum_of_squares', maximum') end;
nipkow@32536
   178
nipkow@32810
   179
(*Single-field updates of the sledgehammer statistics. The tuple is
  (calls, success, nontriv_calls, nontriv_success, lemmas, max_lems,
   time_isa, time_prover, time_prover_fail).*)

val inc_sh_calls = map_sh_data
  (fn (c, s, nc, ns, l, ml, ti, tp, tf) => (c + 1, s, nc, ns, l, ml, ti, tp, tf))

val inc_sh_success = map_sh_data
  (fn (c, s, nc, ns, l, ml, ti, tp, tf) => (c, s + 1, nc, ns, l, ml, ti, tp, tf))

val inc_sh_nontriv_calls = map_sh_data
  (fn (c, s, nc, ns, l, ml, ti, tp, tf) => (c, s, nc + 1, ns, l, ml, ti, tp, tf))

val inc_sh_nontriv_success = map_sh_data
  (fn (c, s, nc, ns, l, ml, ti, tp, tf) => (c, s, nc, ns + 1, l, ml, ti, tp, tf))

fun inc_sh_lemmas n = map_sh_data
  (fn (c, s, nc, ns, l, ml, ti, tp, tf) => (c, s, nc, ns, l + n, ml, ti, tp, tf))

fun inc_sh_max_lems n = map_sh_data
  (fn (c, s, nc, ns, l, ml, ti, tp, tf) => (c, s, nc, ns, l, Int.max (ml, n), ti, tp, tf))

fun inc_sh_time_isa t = map_sh_data
  (fn (c, s, nc, ns, l, ml, ti, tp, tf) => (c, s, nc, ns, l, ml, ti + t, tp, tf))

fun inc_sh_time_prover t = map_sh_data
  (fn (c, s, nc, ns, l, ml, ti, tp, tf) => (c, s, nc, ns, l, ml, ti, tp + t, tf))

fun inc_sh_time_prover_fail t = map_sh_data
  (fn (c, s, nc, ns, l, ml, ti, tp, tf) => (c, s, nc, ns, l, ml, ti, tp, tf + t))
nipkow@32571
   214
nipkow@32810
   215
(*count one more successful minimization*)
val inc_min_succs = map_min_data (fn (n, ratios) => (n + 1, ratios))

(*add r to the accumulated after/before ratios*)
fun inc_min_ab_ratios r = map_min_data (fn (n, ratios) => (n, ratios + r))
nipkow@32549
   220
blanchet@40915
   221
(*Single-field updates of the reconstructor statistics; each takes the
  reconstructor_mode that selects the record. The tuple is
  (calls, success, nontriv_calls, nontriv_success, proofs, time, timeout,
   lemmas, posns).*)

val inc_reconstructor_calls = map_re_data
  (fn (c, s, nc, ns, p, tm, tmo, ls, ps) => (c + 1, s, nc, ns, p, tm, tmo, ls, ps))

val inc_reconstructor_success = map_re_data
  (fn (c, s, nc, ns, p, tm, tmo, ls, ps) => (c, s + 1, nc, ns, p, tm, tmo, ls, ps))

val inc_reconstructor_nontriv_calls = map_re_data
  (fn (c, s, nc, ns, p, tm, tmo, ls, ps) => (c, s, nc + 1, ns, p, tm, tmo, ls, ps))

val inc_reconstructor_nontriv_success = map_re_data
  (fn (c, s, nc, ns, p, tm, tmo, ls, ps) => (c, s, nc, ns + 1, p, tm, tmo, ls, ps))

val inc_reconstructor_proofs = map_re_data
  (fn (c, s, nc, ns, p, tm, tmo, ls, ps) => (c, s, nc, ns, p + 1, tm, tmo, ls, ps))

fun inc_reconstructor_time m t = map_re_data
  (fn (c, s, nc, ns, p, tm, tmo, ls, ps) => (c, s, nc, ns, p, tm + t, tmo, ls, ps)) m

val inc_reconstructor_timeout = map_re_data
  (fn (c, s, nc, ns, p, tm, tmo, ls, ps) => (c, s, nc, ns, p, tm, tmo + 1, ls, ps))

fun inc_reconstructor_lemmas m n = map_re_data
  (fn (c, s, nc, ns, p, tm, tmo, ls, ps) => (c, s, nc, ns, p, tm, tmo, inc_max n ls, ps)) m

fun inc_reconstructor_posns m pos = map_re_data
  (fn (c, s, nc, ns, p, tm, tmo, ls, ps) => (c, s, nc, ns, p, tm, tmo, ls, pos :: ps)) m
boehmes@32521
   256
blanchet@44961
   257
(*print an optional integer, with 0 standing in for NONE*)
fun str0 opt_int = string_of_int (the_default 0 opt_int)
blanchet@44961
   258
boehmes@32521
   259
local
boehmes@32521
   260
boehmes@32521
   261
val str = string_of_int
boehmes@32521
   262
val str3 = Real.fmt (StringCvt.FIX (SOME 3))
boehmes@32521
   263
(*integer percentage of a relative to b, as a string; yields "0" for b = 0
  instead of raising Div, in line with avg_time yielding 0.0 for n = 0*)
fun percentage a b =
  if b = 0 then "0" else string_of_int (a * 100 div b)
boehmes@32521
   264
(*scale an integer time value down by a factor of 1000 (as a real)*)
fun time millis = Real.fromInt millis / 1000.0
boehmes@32521
   265
(*average of the scaled time t over n events; 0.0 when there are no events*)
fun avg_time t n =
  if n <= 0 then 0.0
  else Real.fromInt t / 1000.0 / Real.fromInt n
boehmes@32521
   267
boehmes@34033
   268
(*write the sledgehammer statistics (given in tuple form) through log,
  one line per figure*)
fun log_sh_data log
    (calls, success, nontriv_calls, nontriv_success, lemmas, max_lems, time_isa, time_prover,
      time_prover_fail) =
  let
    fun line label value = log (label ^ value)
  in
    line "Total number of sledgehammer calls: " (str calls);
    line "Number of successful sledgehammer calls: " (str success);
    line "Number of sledgehammer lemmas: " (str lemmas);
    line "Max number of sledgehammer lemmas: " (str max_lems);
    line "Success rate: " (percentage success calls ^ "%");
    line "Total number of nontrivial sledgehammer calls: " (str nontriv_calls);
    line "Number of successful nontrivial sledgehammer calls: " (str nontriv_success);
    line "Total time for sledgehammer calls (Isabelle): " (str3 (time time_isa));
    line "Total time for successful sledgehammer calls (ATP): " (str3 (time time_prover));
    line "Total time for failed sledgehammer calls (ATP): " (str3 (time time_prover_fail));
    line "Average time for sledgehammer calls (Isabelle): " (str3 (avg_time time_isa calls));
    line "Average time for successful sledgehammer calls (ATP): "
      (str3 (avg_time time_prover success));
    line "Average time for failed sledgehammer calls (ATP): "
      (str3 (avg_time time_prover_fail (calls - success)))
  end
boehmes@32521
   287
blanchet@39587
   288
(*render a position as "line:offset", followed by "[T]" when the flag is set*)
fun str_of_pos (pos, triv) =
  let
    val line = str0 (Position.line_of pos)
    val offset = str0 (Position.offset_of pos)
    val marker = if triv then "[T]" else ""
  in line ^ ":" ^ offset ^ marker end
nipkow@32551
   291
blanchet@40915
   292
(*write the reconstructor statistics (given in tuple form) through log; tag
  is spliced into every label, and the list of proved positions is printed
  only for the empty tag*)
fun log_re_data log tag sh_calls (re_calls, re_success, re_nontriv_calls,
     re_nontriv_success, re_proofs, re_time, re_timeout,
    (lemmas, lems_sos, lems_max), re_posns) =
  let
    fun report lead what value = log (lead ^ tag ^ "reconstructor " ^ what ^ value)
    val proofs_note = " (proof: " ^ str re_proofs ^ ")"
  in
    report "Total number of " "calls: " (str re_calls);
    report "Number of successful " "calls: " (str re_success ^ proofs_note);
    report "Number of " "timeouts: " (str re_timeout);
    log ("Success rate: " ^ percentage re_success sh_calls ^ "%");
    report "Total number of nontrivial " "calls: " (str re_nontriv_calls);
    report "Number of successful nontrivial " "calls: " (str re_nontriv_success ^ proofs_note);
    report "Number of successful " "lemmas: " (str lemmas);
    report "SOS of successful " "lemmas: " (str lems_sos);
    report "Max number of successful " "lemmas: " (str lems_max);
    report "Total time for successful " "calls: " (str3 (time re_time));
    report "Average time for successful " "calls: " (str3 (avg_time re_time re_success));
    if tag = "" then log ("Proved: " ^ space_implode " " (map str_of_pos re_posns))
    else ()
  end
nipkow@32571
   313
blanchet@35866
   314
(*write the minimization statistics (given in pair form) through log*)
fun log_min_data log (succs, ab_ratios) =
  let
    val succs_line = "Number of successful minimizations: " ^ string_of_int succs
    val ratios_line = "After/before ratios: " ^ string_of_int ab_ratios
  in log succs_line; log ratios_line end
nipkow@32571
   318
boehmes@32521
   319
in
boehmes@32521
   320
blanchet@40915
   321
(*Write the full report for action id through log. Nothing is printed when
  no sledgehammer call was recorded; reconstructor sections are printed only
  for records with at least one call.*)
fun log_data id log (Data {sh, min, re_u, re_m, re_uft, re_mft, mini}) =
  let
    val ShData {calls = sh_calls, ...} = sh

    fun has_calls (ReData {calls, ...}) = calls > 0
    fun log_re tag re = log_re_data log tag sh_calls (tuple_of_re_data re)

    (*second record is reported only if the first one has calls as well*)
    fun log_reconstructor (tag1, re1) (tag2, re2) =
      if has_calls re1 then
        (log_re tag1 re1;
         log "";
         if has_calls re2 then log_re tag2 re2 else ())
      else ()

    fun log_minimized () =
      if has_calls re_m then
        (log_min_data log (tuple_of_min_data min);
         log "";
         log_reconstructor ("", re_m) ("fully-typed ", re_mft))
      else ()
  in
    if sh_calls <= 0 then ()
    else
     (log ("\n\n\nReport #" ^ string_of_int id ^ ":\n");
      log_sh_data log (tuple_of_sh_data sh);
      log "";
      if mini then
        (if has_calls re_u then
          (log_reconstructor ("unminimized ", re_u) ("unminimized fully-typed ", re_uft);
           log "";
           log_minimized ())
         else ())
      else log_reconstructor ("", re_u) ("fully-typed ", re_uft))
  end
boehmes@32521
   347
boehmes@32521
   348
end
boehmes@32521
   349
boehmes@32521
   350
boehmes@32521
   351
(* Warning: we implicitly assume single-threaded execution here! *)
wenzelm@32740
   352
val data = Unsynchronized.ref ([] : (int * data) list)
boehmes@32521
   353
wenzelm@32740
   354
(*register empty statistics for id; the theory is passed through unchanged*)
fun init id thy =
  let val _ = Unsynchronized.change data (fn entries => (id, empty_data) :: entries)
  in thy end
wenzelm@32567
   355
(*print the report for id, if statistics were registered for it*)
fun done id ({log, ...}: Mirabelle.done_args) =
  (case AList.lookup (op =) (! data) id of
    SOME stats => log_data id log stats
  | NONE => ())
boehmes@32521
   359
wenzelm@32740
   360
(*apply f to the statistics stored under id (no effect for an unknown id)*)
fun change_data id f =
  let val _ = Unsynchronized.change data (AList.map_entry (op =) id f)
  in () end
boehmes@32521
   361
boehmes@32521
   362
blanchet@43315
   363
(*Determine the prover to run: the one named by the "prover" argument, or
  else the first prover of Sledgehammer's default parameters. Returns the
  name paired with the corresponding minimizing prover.*)
fun get_prover ctxt args =
  let
    val name =
      (case AList.lookup (op =) args proverK of
        SOME given => given
      | NONE =>
          (hd (#provers (Sledgehammer_Isar.default_params ctxt []))
            handle List.Empty => error "No ATP available."))
    val prover =
      Sledgehammer_Minimize.get_minimizing_prover ctxt
        Sledgehammer_Provers.Normal (K ()) name
  in (name, prover) end
boehmes@32525
   376
blanchet@47168
   377
type stature = ATP_Problem_Generate.stature
blanchet@38991
   378
blanchet@40915
   379
(* hack *)
blanchet@41605
   380
(*Name of the reconstructor to use: the "reconstructor" argument if given,
  otherwise guessed from the prover message: the text from "metis (" up to
  the next ")" inclusive, else plain "metis" if that word occurs, else "smt".*)
fun reconstructor_from_msg args msg =
  let
    fun guess () =
      if String.isSubstring "metis (" msg then
        let
          val (_, from_metis) = Substring.position "metis (" (Substring.full msg)
          val (up_to_paren, _) = Substring.position ")" from_metis
        in Substring.string up_to_paren ^ ")" end
      else if String.isSubstring "metis" msg then "metis"
      else "smt"
  in
    (case AList.lookup (op =) args reconstructorK of
      SOME name => name
    | NONE => guess ())
  end
blanchet@40915
   394
boehmes@32521
   395
local
boehmes@32521
   396
nipkow@32536
   397
(*outcome of run_sh*)
datatype sh_result =
    SH_OK of int * int * (string * stature) list  (*time_isa, time_prover, used facts*)
  | SH_FAIL of int * int                          (*time_isa, time_prover*)
  | SH_ERROR                                      (*an ERROR was raised*)
nipkow@32536
   401
blanchet@49308
   402
(*Run prover once on the first subgoal of proof state st.
  Returns (message, sh_result): SH_OK when the prover reports no failure
  outcome, SH_FAIL otherwise (including hard timeout and an inappropriate
  goal), and ("error: ...", SH_ERROR) when an ERROR is raised.*)
fun run_sh prover_name prover type_enc strict max_facts slice lam_trans
        uncurried_aliases e_selection_heuristic term_order force_sos
        hard_timeout timeout preplay_timeout sh_minimizeLST
        max_new_mono_instancesLST max_mono_itersLST dir pos st =
  let
    val {context = ctxt, facts = chained_ths, goal} = Proof.goal st
    val subgoal = 1

    (*set a configuration option only if a value was supplied*)
    fun put_opt config opt_value =
      (case opt_value of
        SOME value => Config.put config value
      | NONE => I)

    (*when a directory is given, direct the provers' problem files there*)
    val keep_files =
      (case dir of
        SOME path =>
          Config.put Sledgehammer_Provers.dest_dir path
          #> Config.put Sledgehammer_Provers.problem_prefix
            ("prob_" ^ str0 (Position.line_of pos) ^ "__")
          #> Config.put SMT_Config.debug_files
            (path ^ "/" ^ Name.desymbolize false (ATP_Util.timestamp ()) ^ "_"
              ^ serial_string ())
      | NONE => I)

    val st' =
      st |> Proof.map_context
        (keep_files
          #> put_opt ATP_Systems.e_selection_heuristic e_selection_heuristic
          #> put_opt ATP_Systems.term_order term_order
          #> put_opt ATP_Systems.force_sos force_sos)

    val raw_params =
      [("verbose", "true"),
       ("type_enc", type_enc),
       ("strict", strict),
       ("lam_trans", the_default lam_trans_default lam_trans),
       ("uncurried_aliases", the_default uncurried_aliases_default uncurried_aliases),
       ("max_facts", max_facts),
       ("slice", slice),
       ("timeout", string_of_int timeout),
       ("preplay_timeout", preplay_timeout)]
      |> sh_minimizeLST (*don't confuse the two minimization flags*)
      |> max_new_mono_instancesLST
      |> max_mono_itersLST

    (*from here on the parsed values are used, not the string arguments*)
    val params as {max_facts = max_facts_opt, slice = slicing, ...} =
      Sledgehammer_Isar.default_params ctxt raw_params

    val default_max_facts =
      Sledgehammer_Provers.default_max_facts_for_prover ctxt slicing prover_name
    val is_appropriate_prop =
      Sledgehammer_Provers.is_appropriate_prop_for_prover ctxt prover_name
    val (_, hyp_ts, concl_t) = ATP_Util.strip_subgoal ctxt goal subgoal

    val time_limit =
      (case hard_timeout of
        SOME secs => TimeLimit.timeLimit (Time.fromSeconds secs)
      | NONE => I)

    (*substitute result for runs that never reach the prover's own answer*)
    fun failed failure =
      ({outcome = SOME failure, used_facts = [], run_time = Time.zeroTime,
        preplay =
          K (ATP_Proof_Reconstruct.Failed_to_Play Sledgehammer_Provers.plain_metis),
        message = K "", message_tail = ""}, ~1)

    fun call_prover () =
      let
        val _ =
          if is_appropriate_prop concl_t then ()
          else raise Fail "inappropriate"
        val ho_atp = Sledgehammer_Provers.is_ho_atp ctxt prover_name
        val reserved = Sledgehammer_Util.reserved_isar_keyword_table ()
        val css_table = Sledgehammer_Fact.clasimpset_rule_table_of ctxt
        val facts =
          Sledgehammer_Fact.nearly_all_facts ctxt ho_atp
              Sledgehammer_Fact.no_fact_override reserved css_table chained_ths
              hyp_ts concl_t
          |> filter (is_appropriate_prop o prop_of o snd)
          |> Sledgehammer_MaSh.relevant_facts ctxt params prover_name
                 (the_default default_max_facts max_facts_opt)
                 Sledgehammer_Fact.no_fact_override hyp_ts concl_t
        val problem =
          {state = st', goal = goal, subgoal = subgoal,
           subgoal_count = Sledgehammer_Util.subgoal_count st,
           facts = facts |> map (apfst (apfst (fn name => name ())))
                         |> map Sledgehammer_Provers.Untranslated_Fact}
      in prover params (K (K (K ""))) problem end

    val ({outcome, used_facts, run_time, preplay, message, message_tail}
         : Sledgehammer_Provers.prover_result,
        time_isa) =
      time_limit (Mirabelle.cpu_time call_prover) ()
      handle TimeLimit.TimeOut => failed ATP_Proof.TimedOut
           | Fail "inappropriate" => failed ATP_Proof.Inappropriate

    val time_prover = Time.toMilliseconds run_time
    val msg = message (preplay ()) ^ message_tail
    val result =
      (case outcome of
        NONE => SH_OK (time_isa, time_prover, used_facts)
      | SOME _ => SH_FAIL (time_isa, time_prover))
  in (msg, result) end
  handle ERROR msg => ("error: " ^ msg, SH_ERROR)
boehmes@32521
   488
boehmes@32454
   489
(* Tokenizes the string "name", parses it with Parse_Spec.xthms1 and looks up
   every parsed theorem reference in "ctxt" via Proof_Context.get_fact.
   Returns the exhausted result source. *)
fun thms_of_name ctxt name =
  let
    (* only the first component of each parsed reference is looked up *)
    fun lookup_facts refs =
      maps (fn (xref, _) => Proof_Context.get_fact ctxt xref) refs
    val proper_tokens =
      Source.of_string name
      |> Symbol.source
      |> Token.source {do_recover = SOME false} Keyword.get_lexicons Position.start
      |> Token.source_proper
  in
    Source.exhaust
      (Source.source Token.stopper (Parse_Spec.xthms1 >> lookup_facts) NONE
        proper_tokens)
  end
boehmes@32452
   501
boehmes@32498
   502
in
boehmes@32498
   503
blanchet@44961
   504
(* Runs one Sledgehammer attempt (run_sh) on the proof state "pre" of the
   Mirabelle run arguments, updates the statistics stored under "id" and logs
   the outcome.

   trivial        selects the "[T] " log marker and whether the non-trivial
                  counters are updated
   args           key/value options, read with AList.lookup
   reconstructor  reference; on success it is set from the prover message via
                  reconstructor_from_msg
   named_thms     reference; on success it is set to SOME list of the used
                  facts whose names thms_of_name could resolve *)
fun run_sledgehammer trivial args reconstructor named_thms id
      ({pre=st, log, pos, ...}: Mirabelle.run_args) =
  let
    fun bump f = change_data id f
    fun arg key = AList.lookup (op =) args key
    fun arg_or default key = the_default default (arg key)

    val triv_str = if trivial then "[T] " else ""
    val _ = bump inc_sh_calls
    val _ = if trivial then () else bump inc_sh_nontriv_calls
    val ctxt = Proof.context_of st
    val (prover_name, prover) = get_prover ctxt args
    val type_enc = arg_or type_enc_default type_encK
    val strict = arg_or strict_default strictK
    (* "max_facts" takes precedence over "max_relevant" *)
    val max_facts =
      (case (arg max_factsK, arg max_relevantK) of
        (SOME max, _) => max
      | (NONE, SOME max) => max
      | (NONE, NONE) => max_facts_default)
    val slice = arg_or slice_default sliceK
    val lam_trans = arg lam_transK
    val uncurried_aliases = arg uncurried_aliasesK
    val e_selection_heuristic = arg e_selection_heuristicK
    val term_order = arg term_orderK
    (* any value other than the literal "false" counts as true *)
    val force_sos = Option.map (fn value => "false" <> value) (arg force_sosK)
    val dir = arg keepK
    val timeout = Mirabelle.get_int_setting args (prover_timeoutK, 30)
    (* always use a hard timeout, but give some slack so that the automatic
       minimizer has a chance to do its magic *)
    val hard_timeout = SOME (2 * timeout)
    val preplay_timeout = arg_or preplay_timeout_default preplay_timeoutK
    val sh_minimizeLST = available_parameter args sh_minimizeK "minimize"
    val max_new_mono_instancesLST =
      available_parameter args max_new_mono_instancesK max_new_mono_instancesK
    val max_mono_itersLST =
      available_parameter args max_mono_itersK max_mono_itersK
    val (msg, result) =
      run_sh prover_name prover type_enc strict max_facts slice lam_trans
        uncurried_aliases e_selection_heuristic term_order force_sos
        hard_timeout timeout preplay_timeout sh_minimizeLST
        max_new_mono_instancesLST max_mono_itersLST dir pos st
  in
    (case result of
      SH_ERROR => log (sh_tag id ^ "failed: " ^ msg)
    | SH_FAIL (time_isa, time_prover) =>
        (bump (inc_sh_time_isa time_isa);
         bump (inc_sh_time_prover_fail time_prover);
         log (sh_tag id ^ triv_str ^ "failed: " ^ msg))
    | SH_OK (time_isa, time_prover, names) =>
        let
          (* facts whose name cannot be turned into theorems are dropped *)
          fun get_thms (fact as (fact_name, _)) =
            (case try (thms_of_name ctxt) fact_name of
              SOME thms => SOME (fact, thms)
            | NONE => NONE)
          val num_names = length names
        in
          bump inc_sh_success;
          if trivial then () else bump inc_sh_nontriv_success;
          bump (inc_sh_lemmas num_names);
          bump (inc_sh_max_lems num_names);
          bump (inc_sh_time_isa time_isa);
          bump (inc_sh_time_prover time_prover);
          reconstructor := reconstructor_from_msg args msg;
          named_thms := SOME (map_filter get_thms names);
          log (String.concat
            [sh_tag id, triv_str, "succeeded (", string_of_int time_isa, "+",
             string_of_int time_prover, ") [", prover_name, "]:\n", msg])
        end)
  end
boehmes@32525
   568
boehmes@32525
   569
end
boehmes@32525
   570
blanchet@40915
   571
(* Passes the facts currently stored in "named_thms" to
   Sledgehammer_Minimize.minimize_facts and logs the outcome.

   When the minimizer returns a fact list whose length differs from the
   original one, "named_thms" is overwritten with it and "reconstructor" is
   set from the minimizer message; otherwise both references are left alone.

   The original number of facts is used as a divisor below;
   sledgehammer_action only calls this function with a non-empty list. *)
fun run_minimize args reconstructor named_thms id
        ({pre=st, log, ...}: Mirabelle.run_args) =
  let
    fun arg key = AList.lookup (op =) args key
    fun arg_or default key = the_default default (arg key)

    val ctxt = Proof.context_of st
    val initial_thms = these (!named_thms)
    val n0 = length initial_thms
    val (prover_name, _) = get_prover ctxt args
    val type_enc = arg_or type_enc_default type_encK
    val strict = arg_or strict_default strictK
    val timeout =
      arg minimize_timeoutK
      (* FIXME Symbol.explode (?) *)
      |> Option.map (fn str => fst (read_int (raw_explode str)))
      |> the_default minimize_timeout_default
    val preplay_timeout = arg_or preplay_timeout_default preplay_timeoutK
    val sh_minimizeLST = available_parameter args sh_minimizeK "minimize"
    val max_new_mono_instancesLST =
      available_parameter args max_new_mono_instancesK max_new_mono_instancesK
    val max_mono_itersLST =
      available_parameter args max_mono_itersK max_mono_itersK
    val fixed_params =
      [("provers", prover_name),
       ("verbose", "true"),
       ("type_enc", type_enc),
       ("strict", strict),
       ("timeout", string_of_int timeout),
       ("preplay_timeout", preplay_timeout)]
    val params =
      Sledgehammer_Isar.default_params ctxt
        (max_mono_itersLST
          (max_new_mono_instancesLST
            (*don't confuse the two minimization flags*)
            (sh_minimizeLST fixed_params)))
    val minimize =
      Sledgehammer_Minimize.minimize_facts (K ()) prover_name params
        true 1 (Sledgehammer_Util.subgoal_count st)
    val _ = log separator
    val (used_facts, (preplay, message, message_tail)) =
      minimize st initial_thms
    val msg = message (preplay ()) ^ message_tail
  in
    (case used_facts of
      NONE => log (minimize_tag id ^ "failed: " ^ msg)
    | SOME named_thms' =>
        let
          val n = length named_thms'
          val _ = change_data id inc_min_succs
          (* percentage of the original facts that survived minimization *)
          val _ = change_data id (inc_min_ab_ratios ((100 * n) div n0))
        in
          if n <> n0 then
            (reconstructor := reconstructor_from_msg args msg;
             named_thms := SOME named_thms';
             log (minimize_tag id ^ "succeeded:\n" ^ msg))
          else
            log (minimize_tag id ^ "already minimal")
        end)
  end
boehmes@32525
   619
blanchet@45413
   620
(* Sledgehammer option list for the given prover and type encoding:
   "max_facts" is "0", "strict" is "true", "slice" is "false", and the timeout
   is rendered in whole seconds (Time.toSeconds). *)
fun override_params prover type_enc timeout =
  let
    val timeout_secs = string_of_int (Time.toSeconds timeout)
  in
    [("provers", prover),
     ("max_facts", "0"),
     ("type_enc", type_enc),
     ("strict", "true"),
     ("slice", "false"),
     ("timeout", timeout_secs)]
  end
blanchet@45301
   627
blanchet@40915
   628
(* Tries to replay a proof from the facts in "named_thms" with the tactic
   selected by the current content of the "reconstructor" reference, updates
   the statistics for mode "m" stored under "id", and logs the outcome.

   Returns true whenever the timed run finished without raising
   TimeLimit.TimeOut or ERROR (even if the tactic itself failed), and false
   otherwise.

   full  when true (and the reconstructor is neither "sledgehammer_tac" nor
         "smt"), metis is run with ATP_Proof_Reconstruct.full_typesN
   name  only compared against "proof" to decide whether to count the
         success via inc_reconstructor_proofs *)
fun run_reconstructor trivial full m name reconstructor named_thms id
    ({pre=st, timeout, log, pos, ...}: Mirabelle.run_args) =
  let
    fun bump f = change_data id f

    (* Builds the tactic; everything here is evaluated only once "ctxt" is
       supplied, i.e. inside Mirabelle.can_apply. *)
    fun do_reconstructor used ctxt =
      let
        fun ref_of_str str =
          fst (Parse_Spec.xthm (Outer_Syntax.scan Position.none (suffix ";" str)))
        val thms = maps snd used
        val facts = map (fn ((fact_name, _), _) => ref_of_str fact_name) used
        val fact_override = {add = facts, del = [], only = true}
        (* fraction "time_slice" of the overall timeout *)
        fun my_timeout time_slice =
          Time.fromReal (time_slice * Time.toReal timeout)
        fun sledge_tac time_slice prover type_enc =
          Sledgehammer_Tactics.sledgehammer_as_oracle_tac ctxt
            (override_params prover type_enc (my_timeout time_slice))
            fact_override
        fun metis type_encs lam_trans =
          Metis_Tactic.metis_tac type_encs lam_trans ctxt thms
        val default_lam_trans = ATP_Proof_Reconstruct.metis_default_lam_trans
        val which = !reconstructor
      in
        (case which of
          "sledgehammer_tac" =>
            sledge_tac 0.2 ATP_Systems.z3_tptpN "mono_native"
            ORELSE' sledge_tac 0.2 ATP_Systems.eN "mono_guards??"
            ORELSE' sledge_tac 0.2 ATP_Systems.vampireN "mono_guards??"
            ORELSE' sledge_tac 0.2 ATP_Systems.spassN "poly_tags"
            ORELSE' metis [] ATP_Problem_Generate.combsN
        | "smt" => SMT_Solver.smt_tac ctxt thms
        | _ =>
            if full then
              metis [ATP_Proof_Reconstruct.full_typesN] default_lam_trans
            else if String.isPrefix "metis (" which then
              let
                (* drop the leading "metis" token, then parse the options *)
                val option_tokens =
                  tl (filter Token.is_proper
                    (Outer_Syntax.scan Position.start which))
                val (opt_type_encs, opt_lam_trans) =
                  fst (Metis_Tactic.parse_metis_options option_tokens)
                val type_encs =
                  the_default [ATP_Proof_Reconstruct.partial_typesN] opt_type_encs
                val lam_trans = the_default default_lam_trans opt_lam_trans
              in metis type_encs lam_trans end
            else if which = "metis" then
              metis [] default_lam_trans
            else
              K all_tac)
      end

    fun apply_reconstructor used =
      Mirabelle.can_apply timeout (do_reconstructor used) st

    (* Turns a (success flag, time) pair into a log fragment; a success also
       updates the counters for mode "m". *)
    fun with_time (succeeded, t) =
      if succeeded then
        (bump (inc_reconstructor_success m);
         if trivial then () else bump (inc_reconstructor_nontriv_success m);
         bump (inc_reconstructor_lemmas m (length named_thms));
         bump (inc_reconstructor_time m t);
         bump (inc_reconstructor_posns m (pos, trivial));
         if name = "proof" then bump (inc_reconstructor_proofs m) else ();
         "succeeded (" ^ string_of_int t ^ ")")
      else
        "failed (" ^ string_of_int t ^ ")"

    fun timed_reconstructor used =
      let
        val timed_outcome = Mirabelle.cpu_time apply_reconstructor used
      in
        (with_time timed_outcome, true)
      end
      handle TimeLimit.TimeOut =>
               (bump (inc_reconstructor_timeout m); ("timeout", false))
           | ERROR msg => ("error: " ^ msg, false)

    val _ = log separator
    val _ = bump (inc_reconstructor_calls m)
    val _ = if trivial then () else bump (inc_reconstructor_nontriv_calls m)

    val (report, completed) = timed_reconstructor named_thms
    val _ = log (prefix (reconstructor_tag reconstructor id) report)
  in
    completed
  end
boehmes@32432
   703
blanchet@41524
   704
(* Time limit passed to Try0.try0 when sledgehammer_action checks whether a
   goal is trivial. *)
val try_timeout = seconds 5.0
blanchet@39583
   705
blanchet@45302
   706
(* crude hack *)
blanchet@45302
   707
(* Global counter of goals considered by sledgehammer_action; it is
   incremented there and compared against the "max_calls" setting. *)
val num_sledgehammer_calls = Unsynchronized.ref 0
blanchet@45302
   708
boehmes@34033
   709
(* Mirabelle action for a single goal.

   Goals on whose major premise Logic.dest_conjunction or Logic.dest_equals
   succeeds are skipped, as are all goals once num_sledgehammer_calls exceeds
   the "max_calls" setting.  Otherwise Sledgehammer is run; if it stored a
   fact list, proof reconstruction is attempted, and, when the "minimize"
   option is present and the list is non-empty, the facts are minimized and
   reconstruction is attempted again. *)
fun sledgehammer_action args id (st as {pre, name, ...}: Mirabelle.run_args) =
  let
    val goal = Thm.major_prem_of (#goal (Proof.goal pre))
    fun arg_or default key = the_default default (AList.lookup (op =) args key)
  in
    if not (can Logic.dest_conjunction goal)
      andalso not (can Logic.dest_equals goal)
    then
      let
        val max_calls = the (Int.fromString (arg_or max_calls_default max_callsK))
        val _ = num_sledgehammer_calls := !num_sledgehammer_calls + 1
      in
        if !num_sledgehammer_calls <= max_calls then
          let
            val reconstructor = Unsynchronized.ref ""
            val named_thms =
              Unsynchronized.ref
                (NONE : ((string * stature) * thm list) list option)
            val minimize = AList.defined (op =) args minimizeK
            val metis_ft = AList.defined (op =) args metis_ftK
            val check_trivial =
              the (Bool.fromString (arg_or trivial_default check_trivialK))
            (* a timeout of the triviality check counts as "not trivial" *)
            val trivial =
              check_trivial andalso
                (Try0.try0 (SOME try_timeout) ([], [], [], []) pre
                 handle TimeLimit.TimeOut => false)

            (* one reconstruction attempt on the current fact list *)
            fun reconstruct full mode =
              Mirabelle.catch_result (reconstructor_tag reconstructor) false
                (run_reconstructor trivial full mode name reconstructor
                  (these (!named_thms))) id st

            (* with "metis_ft", retry in mode m2 with full = true when the
               first attempt returned false *)
            fun apply_reconstructor m1 m2 =
              let
                val first_ok = reconstruct false m1
              in
                if metis_ft andalso not first_ok
                then ignore (reconstruct true m2)
                else ()
              end
          in
            change_data id (set_mini minimize);
            Mirabelle.catch sh_tag
              (run_sledgehammer trivial args reconstructor named_thms) id st;
            (case !named_thms of
              NONE => ()
            | SOME _ =>
                (apply_reconstructor Unminimized UnminimizedFT;
                 if minimize andalso not (null (these (!named_thms))) then
                   (Mirabelle.catch minimize_tag
                      (run_minimize args reconstructor named_thms) id st;
                    apply_reconstructor Minimized MinimizedFT)
                 else ()))
          end
        else ()
      end
    else ()
  end
boehmes@32385
   765
boehmes@32511
   766
(* Registers this action with Mirabelle: "init", the per-goal action
   specialised to "args", and "done". *)
fun invoke args =
  let
    val action = sledgehammer_action args
  in
    Mirabelle.register (init, action, done)
  end
boehmes@32385
   768
boehmes@32385
   769
end