src/HOL/Tools/ATP/atp_proof.ML
author blanchet
Sat, 29 Oct 2011 13:15:58 +0200
changeset 46172 866b075aa99b
parent 46104 7187bce94e88
child 46422 a62c7a21f4ab
permissions -rw-r--r--
added sorted DFG output for coming version of SPASS
     1 (*  Title:      HOL/Tools/ATP/atp_proof.ML
     2     Author:     Lawrence C. Paulson, Cambridge University Computer Laboratory
     3     Author:     Claire Quigley, Cambridge University Computer Laboratory
     4     Author:     Jasmin Blanchette, TU Muenchen
     5 
     6 Abstract representation of ATP proofs and TSTP/SPASS syntax.
     7 *)
     8 
     9 signature ATP_PROOF =
    10 sig
    11   type ('a, 'b) ho_term = ('a, 'b) ATP_Problem.ho_term
    12   type ('a, 'b, 'c) formula = ('a, 'b, 'c) ATP_Problem.formula
    13   type 'a problem = 'a ATP_Problem.problem
    14 
    15   exception UNRECOGNIZED_ATP_PROOF of unit
    16 
    17   datatype failure =
    18     Unprovable |
    19     GaveUp |
    20     ProofMissing |
    21     ProofIncomplete |
    22     UnsoundProof of bool * string list |
    23     CantConnect |
    24     TimedOut |
    25     Inappropriate |
    26     OutOfResources |
    27     NoPerl |
    28     NoLibwwwPerl |
    29     MalformedInput |
    30     MalformedOutput |
    31     Interrupted |
    32     Crashed |
    33     InternalError |
    34     UnknownError of string
    35 
    36   type step_name = string * string list option
    37 
    38   datatype 'a step =
    39     Definition of step_name * 'a * 'a |
    40     Inference of step_name * 'a * string * step_name list
    41 
    42   type 'a proof = ('a, 'a, ('a, 'a) ho_term) formula step list
    43 
    44   val short_output : bool -> string -> string
    45   val string_for_failure : failure -> string
    46   val extract_important_message : string -> string
    47   val extract_known_failure :
    48     (failure * string) list -> string -> failure option
    49   val extract_tstplike_proof_and_outcome :
    50     bool -> bool -> (string * string) list -> (failure * string) list -> string
    51     -> string * failure option
    52   val is_same_atp_step : step_name -> step_name -> bool
    53   val scan_general_id : string list -> string * string list
    54   val parse_formula :
    55     string list -> (string, 'a, (string, 'a) ho_term) formula * string list
    56   val atp_proof_from_tstplike_proof :
    57     string problem -> string -> string -> string proof
    58   val clean_up_atp_proof_dependencies : string proof -> string proof
    59   val map_term_names_in_atp_proof :
    60     (string -> string) -> string proof -> string proof
    61   val nasty_atp_proof : string Symtab.table -> string proof -> string proof
    62 end;
    63 
    64 structure ATP_Proof : ATP_PROOF =
    65 struct
    66 
    67 open ATP_Util
    68 open ATP_Problem
    69 
    70 exception UNRECOGNIZED_ATP_PROOF of unit
    71 
    72 datatype failure =
    73   Unprovable |
    74   GaveUp |
    75   ProofMissing |
    76   ProofIncomplete |
    77   UnsoundProof of bool * string list |
    78   CantConnect |
    79   TimedOut |
    80   Inappropriate |
    81   OutOfResources |
    82   NoPerl |
    83   NoLibwwwPerl |
    84   MalformedInput |
    85   MalformedOutput |
    86   Interrupted |
    87   Crashed |
    88   InternalError |
    89   UnknownError of string
    90 
    91 fun elide_string threshold s =
    92   if size s > threshold then
    93     String.extract (s, 0, SOME (threshold div 2 - 5)) ^ " ...... " ^
    94     String.extract (s, size s - (threshold + 1) div 2 + 6, NONE)
    95   else
    96     s
    97 fun short_output verbose output =
    98   if verbose then
    99     if output = "" then "No details available" else elide_string 1000 output
   100   else
   101     ""
   102 
   103 val missing_message_tail =
   104   " appears to be missing. You will need to install it if you want to invoke \
   105   \remote provers."
   106 
   107 fun involving [] = ""
   108   | involving ss =
   109     "involving " ^ space_implode " " (Try.serial_commas "and" (map quote ss)) ^
   110     " "
   111 
   112 fun string_for_failure Unprovable = "The problem is unprovable."
   113   | string_for_failure GaveUp = "The prover gave up."
   114   | string_for_failure ProofMissing =
   115     "The prover claims the conjecture is a theorem but did not provide a proof."
   116   | string_for_failure ProofIncomplete =
   117     "The prover claims the conjecture is a theorem but provided an incomplete \
   118     \proof."
   119   | string_for_failure (UnsoundProof (false, ss)) =
   120     "The prover found a type-unsound proof " ^ involving ss ^
   121     "(or, less likely, your axioms are inconsistent). Specify a sound type \
   122     \encoding or omit the \"type_enc\" option."
   123   | string_for_failure (UnsoundProof (true, ss)) =
   124     "The prover found a type-unsound proof " ^ involving ss ^
   125     "even though a supposedly type-sound encoding was used (or, less likely, \
   126     \your axioms are inconsistent). Please report this to the Isabelle \
   127     \developers."
   128   | string_for_failure CantConnect = "Cannot connect to remote server."
   129   | string_for_failure TimedOut = "Timed out."
   130   | string_for_failure Inappropriate =
   131     "The problem lies outside the prover's scope."
   132   | string_for_failure OutOfResources = "The prover ran out of resources."
   133   | string_for_failure NoPerl = "Perl" ^ missing_message_tail
   134   | string_for_failure NoLibwwwPerl =
   135     "The Perl module \"libwww-perl\"" ^ missing_message_tail
   136   | string_for_failure MalformedInput =
   137     "The generated problem is malformed. Please report this to the Isabelle \
   138     \developers."
   139   | string_for_failure MalformedOutput = "The prover output is malformed."
   140   | string_for_failure Interrupted = "The prover was interrupted."
   141   | string_for_failure Crashed = "The prover crashed."
   142   | string_for_failure InternalError = "An internal prover error occurred."
   143   | string_for_failure (UnknownError string) =
   144     "A prover error occurred" ^
   145     (if string = "" then ". (Pass the \"verbose\" option for details.)"
   146      else ":\n" ^ string)
   147 
   148 fun extract_delimited (begin_delim, end_delim) output =
   149   output |> first_field begin_delim |> the |> snd
   150          |> first_field end_delim |> the |> fst
   151          |> first_field "\n" |> the |> snd
   152   handle Option.Option => ""
   153 
   154 val tstp_important_message_delims =
   155   ("% SZS start RequiredInformation", "% SZS end RequiredInformation")
   156 
   157 fun extract_important_message output =
   158   case extract_delimited tstp_important_message_delims output of
   159     "" => ""
   160   | s => s |> space_explode "\n" |> filter_out (curry (op =) "")
   161            |> map (perhaps (try (unprefix "%")))
   162            |> map (perhaps (try (unprefix " ")))
   163            |> space_implode "\n " |> quote
   164 
   165 (* Splits by the first possible of a list of delimiters. *)
   166 fun extract_tstplike_proof delims output =
   167   case pairself (find_first (fn s => String.isSubstring s output))
   168                 (ListPair.unzip delims) of
   169     (SOME begin_delim, SOME end_delim) =>
   170     extract_delimited (begin_delim, end_delim) output
   171   | _ => ""
   172 
   173 fun extract_known_failure known_failures output =
   174   known_failures
   175   |> find_first (fn (_, pattern) => String.isSubstring pattern output)
   176   |> Option.map fst
   177 
   178 fun extract_tstplike_proof_and_outcome verbose complete proof_delims
   179                                        known_failures output =
   180   case (extract_tstplike_proof proof_delims output,
   181         extract_known_failure known_failures output) of
   182     (_, SOME ProofIncomplete) => ("", SOME ProofIncomplete)
   183   | ("", SOME ProofMissing) => ("", NONE)
   184   | ("", SOME failure) =>
   185     ("", SOME (if failure = GaveUp andalso complete then Unprovable
   186                else failure))
   187   | ("", NONE) => ("", SOME (UnknownError (short_output verbose output)))
   188   | (tstplike_proof, _) => (tstplike_proof, NONE)
   189 
   190 type step_name = string * string list option
   191 
   192 fun is_same_atp_step (s1, _) (s2, _) = s1 = s2
   193 
   194 val vampire_fact_prefix = "f"
   195 
   196 fun step_name_ord p =
   197   let val q = pairself fst p in
   198     (* The "unprefix" part is to cope with remote Vampire's output. The proper
   199        solution would be to perform a topological sort, e.g. using the nice
   200        "Graph" functor. *)
   201     case pairself (Int.fromString
   202                    o perhaps (try (unprefix vampire_fact_prefix))) q of
   203       (NONE, NONE) => string_ord q
   204     | (NONE, SOME _) => LESS
   205     | (SOME _, NONE) => GREATER
   206     | (SOME i, SOME j) => int_ord (i, j)
   207   end
   208 
   209 datatype 'a step =
   210   Definition of step_name * 'a * 'a |
   211   Inference of step_name * 'a * string * step_name list
   212 
   213 type 'a proof = ('a, 'a, ('a, 'a) ho_term) formula step list
   214 
   215 fun step_name (Definition (name, _, _)) = name
   216   | step_name (Inference (name, _, _, _)) = name
   217 
   218 (**** PARSING OF TSTP FORMAT ****)
   219 
   220 (* FIXME: temporary hack *)
   221 fun repair_waldmeister_step_name s =
   222   case space_explode "." s of
   223     [a, b, c, d] =>
   224     (case a of "0" => "X" | "1" => "Y" | _ => "Z" ^ a) ^
   225     (if size b = 1 then "0" else "") ^ b ^ c ^ d
   226   | _ => s
   227 
   228 (* Strings enclosed in single quotes (e.g., file names) *)
   229 val scan_general_id =
   230   $$ "'" |-- Scan.repeat (~$$ "'") --| $$ "'"
   231      >> implode >> repair_waldmeister_step_name
   232   || Scan.repeat ($$ "$") -- Scan.many1 Symbol.is_letdig
   233      >> (fn (ss1, ss2) => implode ss1 ^ implode ss2)
   234 
   235 val skip_term =
   236   let
   237     fun skip _ accum [] = (accum, [])
   238       | skip 0 accum (ss as "," :: _) = (accum, ss)
   239       | skip 0 accum (ss as ")" :: _) = (accum, ss)
   240       | skip 0 accum (ss as "]" :: _) = (accum, ss)
   241       | skip n accum ((s as "(") :: ss) = skip (n + 1) (s :: accum) ss
   242       | skip n accum ((s as "[") :: ss) = skip (n + 1) (s :: accum) ss
   243       | skip n accum ((s as "]") :: ss) = skip (n - 1) (s :: accum) ss
   244       | skip n accum ((s as ")") :: ss) = skip (n - 1) (s :: accum) ss
   245       | skip n accum (s :: ss) = skip n (s :: accum) ss
   246   in skip 0 [] #>> (rev #> implode) end
   247 
   248 datatype source =
   249   File_Source of string * string option |
   250   Inference_Source of string * string list
   251 
   252 val dummy_phi = AAtom (ATerm ("", []))
   253 val dummy_inference = Inference_Source ("", [])
   254 
   255 fun parse_dependencies x = (skip_term ::: Scan.repeat ($$ "," |-- skip_term)) x
   256 
   257 fun parse_source x =
   258   (Scan.this_string "file" |-- $$ "(" |-- scan_general_id --
   259      Scan.option ($$ "," |-- scan_general_id) --| $$ ")"
   260      >> File_Source
   261    || Scan.this_string "inference" |-- $$ "(" |-- scan_general_id
   262         --| skip_term --| $$ "," --| skip_term --| $$ "," --| $$ "["
   263         -- parse_dependencies --| $$ "]" --| $$ ")"
   264        >> Inference_Source
   265    || skip_term >> K dummy_inference) x
   266 
   267 fun list_app (f, args) =
   268   fold (fn arg => fn f => ATerm (tptp_app, [f, arg])) args f
   269 
   270 (* We ignore TFF and THF types for now. *)
   271 fun parse_type_stuff x =
   272   Scan.repeat (($$ tptp_has_type || $$ tptp_fun_type) |-- parse_arg) x
   273 and parse_arg x =
   274   ($$ "(" |-- parse_term --| $$ ")" --| parse_type_stuff
   275    || scan_general_id --| parse_type_stuff
   276         -- Scan.optional ($$ "(" |-- parse_terms --| $$ ")") []
   277       >> ATerm) x
   278 and parse_app x =
   279   (parse_arg -- Scan.repeat ($$ tptp_app |-- parse_arg) >> list_app) x
   280 and parse_term x =
   281   (parse_app -- Scan.option (Scan.option ($$ tptp_not_infix) --| $$ tptp_equal
   282                              -- parse_app)
   283    >> (fn (u1, NONE) => u1
   284         | (u1, SOME (NONE, u2)) => ATerm ("equal", [u1, u2])
   285         | (u1, SOME (SOME _, u2)) =>
   286           ATerm (tptp_not, [ATerm ("equal", [u1, u2])]))) x
   287 and parse_terms x =
   288   (parse_term ::: Scan.repeat ($$ "," |-- parse_term)) x
   289 
   290 (* TODO: Avoid duplication with "parse_term" above. *)
   291 fun parse_atom x =
   292   (parse_term -- Scan.option (Scan.option ($$ tptp_not_infix) --| $$ tptp_equal
   293                               -- parse_term)
   294    >> (fn (u1, NONE) => AAtom u1
   295         | (u1, SOME (NONE, u2)) => AAtom (ATerm ("equal", [u1, u2]))
   296         | (u1, SOME (SOME _, u2)) =>
   297           mk_anot (AAtom (ATerm ("equal", [u1, u2]))))) x
   298 
   299 fun ho_term_head (ATerm (s, _)) = s
   300 
   301 (* TPTP formulas are fully parenthesized, so we don't need to worry about
   302    operator precedence. *)
   303 fun parse_literal x =
   304   ((Scan.repeat ($$ tptp_not) >> length)
   305       -- ($$ "(" |-- parse_formula --| $$ ")"
   306           || parse_quantified_formula
   307           || parse_atom)
   308       >> (fn (n, phi) => phi |> n mod 2 = 1 ? mk_anot)) x
   309 and parse_formula x =
   310   (parse_literal
   311    -- Scan.option ((Scan.this_string tptp_implies
   312                     || Scan.this_string tptp_iff
   313                     || Scan.this_string tptp_not_iff
   314                     || Scan.this_string tptp_if
   315                     || $$ tptp_or
   316                     || $$ tptp_and) -- parse_formula)
   317    >> (fn (phi1, NONE) => phi1
   318         | (phi1, SOME (c, phi2)) =>
   319           if c = tptp_implies then mk_aconn AImplies phi1 phi2
   320           else if c = tptp_iff then mk_aconn AIff phi1 phi2
   321           else if c = tptp_not_iff then mk_anot (mk_aconn AIff phi1 phi2)
   322           else if c = tptp_if then mk_aconn AImplies phi2 phi1
   323           else if c = tptp_or then mk_aconn AOr phi1 phi2
   324           else if c = tptp_and then mk_aconn AAnd phi1 phi2
   325           else raise Fail ("impossible connective " ^ quote c))) x
   326 and parse_quantified_formula x =
   327   (($$ tptp_forall >> K AForall || $$ tptp_exists >> K AExists)
   328    --| $$ "[" -- parse_terms --| $$ "]" --| $$ ":" -- parse_literal
   329    >> (fn ((q, ts), phi) =>
   330           (* We ignore TFF and THF types for now. *)
   331           AQuant (q, map (rpair NONE o ho_term_head) ts, phi))) x
   332 
   333 val parse_tstp_extra_arguments =
   334   Scan.optional ($$ "," |-- parse_source --| Scan.option ($$ "," |-- skip_term))
   335                 dummy_inference
   336 
   337 val waldmeister_conjecture = "conjecture_1"
   338 
   339 val tofof_fact_prefix = "fof_"
   340 
   341 fun is_same_term subst tm1 tm2 =
   342   let
   343     fun do_term_pair _ NONE = NONE
   344       | do_term_pair (ATerm (s1, tm1), ATerm (s2, tm2)) (SOME subst) =
   345         case pairself is_tptp_variable (s1, s2) of
   346           (true, true) =>
   347           (case AList.lookup (op =) subst s1 of
   348              SOME s2' => if s2' = s2 then SOME subst else NONE
   349            | NONE =>
   350              if null (AList.find (op =) subst s2) then SOME ((s1, s2) :: subst)
   351              else NONE)
   352         | (false, false) =>
   353           if s1 = s2 andalso length tm1 = length tm2 then
   354             SOME subst |> fold do_term_pair (tm1 ~~ tm2)
   355           else
   356             NONE
   357         | _ => NONE
   358   in SOME subst |> do_term_pair (tm1, tm2) |> is_some end
   359 
   360 fun is_same_formula subst (AQuant (q1, xs1, phi1)) (AQuant (q2, xs2, phi2)) =
   361     q1 = q2 andalso length xs1 = length xs2 andalso
   362     is_same_formula ((map fst xs1 ~~ map fst xs2) @ subst) phi1 phi2
   363   | is_same_formula subst (AConn (c1, phis1)) (AConn (c2, phis2)) =
   364     c1 = c2 andalso length phis1 = length phis2 andalso
   365     forall (uncurry (is_same_formula subst)) (phis1 ~~ phis2)
   366   | is_same_formula subst (AAtom (ATerm ("equal", [tm11, tm12]))) (AAtom tm2) =
   367     is_same_term subst (ATerm ("equal", [tm11, tm12])) tm2 orelse
   368     is_same_term subst (ATerm ("equal", [tm12, tm11])) tm2
   369   | is_same_formula subst (AAtom tm1) (AAtom tm2) = is_same_term subst tm1 tm2
   370   | is_same_formula _ _ _ = false
   371 
   372 fun matching_formula_line_identifier phi (Formula (ident, _, phi', _, _)) =
   373     if is_same_formula [] phi phi' then SOME ident else NONE
   374   | matching_formula_line_identifier _ _ = NONE
   375 
   376 fun find_formula_in_problem problem phi =
   377   problem |> maps snd |> map_filter (matching_formula_line_identifier phi)
   378           |> try (single o hd)
   379 
   380 (* Syntax: (cnf|fof|tff|thf)\(<num>, <formula_role>,
   381             <formula> <extra_arguments>\).
   382    The <num> could be an identifier, but we assume integers. *)
   383 fun parse_tstp_line problem =
   384   ((Scan.this_string tptp_cnf || Scan.this_string tptp_fof
   385     || Scan.this_string tptp_tff || Scan.this_string tptp_thf) -- $$ "(")
   386     |-- scan_general_id --| $$ "," -- Symbol.scan_id --| $$ ","
   387     -- (parse_formula || skip_term >> K dummy_phi) -- parse_tstp_extra_arguments
   388     --| $$ ")" --| $$ "."
   389    >> (fn (((num, role), phi), deps) =>
   390           let
   391             val (name, rule, deps) =
   392               (* Waldmeister isn't exactly helping. *)
   393               case deps of
   394                 File_Source (_, SOME s) =>
   395                 ((num,
   396                   if s = waldmeister_conjecture then
   397                     find_formula_in_problem problem (mk_anot phi)
   398                   else
   399                     SOME [s |> perhaps (try (unprefix tofof_fact_prefix))]), "",
   400                  [])
   401               | File_Source _ =>
   402                 ((num, find_formula_in_problem problem phi), "", [])
   403               | Inference_Source (rule, deps) => ((num, NONE), rule, deps)
   404           in
   405             case role of
   406               "definition" =>
   407               (case phi of
   408                  AConn (AIff, [phi1 as AAtom _, phi2]) =>
   409                  Definition (name, phi1, phi2)
   410                | AAtom (ATerm ("equal", _)) =>
   411                  (* Vampire's equality proxy axiom *)
   412                  Inference (name, phi, rule, map (rpair NONE) deps)
   413                | _ => raise UNRECOGNIZED_ATP_PROOF ())
   414             | _ => Inference (name, phi, rule, map (rpair NONE) deps)
   415           end)
   416 
   417 (**** PARSING OF SPASS OUTPUT ****)
   418 
   419 (* SPASS returns clause references of the form "x.y". We ignore "y", whose role
   420    is not clear anyway. *)
   421 val parse_dot_name = scan_general_id --| $$ "." --| scan_general_id
   422 
   423 val parse_spass_annotations =
   424   Scan.optional ($$ ":" |-- Scan.repeat (parse_dot_name
   425                                          --| Scan.option ($$ ","))) []
   426 
   427 (* It is not clear why some literals are followed by sequences of stars and/or
   428    pluses. We ignore them. *)
   429 fun parse_decorated_atom x =
   430   (parse_atom --| Scan.repeat ($$ "*" || $$ "+" || $$ " ")) x
   431 
   432 fun mk_horn ([], []) = AAtom (ATerm ("c_False", []))
   433   | mk_horn ([], pos_lits) = foldr1 (uncurry (mk_aconn AOr)) pos_lits
   434   | mk_horn (neg_lits, []) = mk_anot (foldr1 (uncurry (mk_aconn AAnd)) neg_lits)
   435   | mk_horn (neg_lits, pos_lits) =
   436     mk_aconn AImplies (foldr1 (uncurry (mk_aconn AAnd)) neg_lits)
   437                       (foldr1 (uncurry (mk_aconn AOr)) pos_lits)
   438 
   439 fun parse_horn_clause x =
   440   (Scan.repeat parse_decorated_atom --| $$ "|" --| $$ "|"
   441      -- Scan.repeat parse_decorated_atom --| $$ "-" --| $$ ">"
   442      -- Scan.repeat parse_decorated_atom
   443    >> (mk_horn o apfst (op @))) x
   444 
   445 fun resolve_spass_num spass_names num =
   446   case Int.fromString num of
   447     SOME j => if j > 0 andalso j <= Vector.length spass_names then
   448                 SOME (Vector.sub (spass_names, j - 1))
   449               else
   450                 NONE
   451   | NONE => NONE
   452 
   453 (* Syntax: <num>[0:<inference><annotations>] <atoms> || <atoms> -> <atoms>. *)
   454 fun parse_spass_line spass_names =
   455   scan_general_id --| $$ "[" --| $$ "0" --| $$ ":" -- Symbol.scan_id
   456     -- parse_spass_annotations --| $$ "]" -- parse_horn_clause --| $$ "."
   457   >> (fn (((num, rule), deps), u) =>
   458          Inference ((num, resolve_spass_num spass_names num), u, rule,
   459                     map (swap o `(resolve_spass_num spass_names)) deps))
   460 
   461 (* Syntax: <name> *)
   462 fun parse_satallax_line x =
   463   (scan_general_id --| Scan.option ($$ " ")
   464    >> (fn s => Inference ((s, SOME [s]), dummy_phi, "", []))) x
   465 
   466 fun parse_line problem spass_names =
   467   parse_tstp_line problem || parse_spass_line spass_names || parse_satallax_line
   468 fun parse_proof problem spass_names tstp =
   469   tstp |> strip_spaces_except_between_idents
   470        |> raw_explode
   471        |> Scan.finite Symbol.stopper
   472               (Scan.error (!! (fn _ => raise UNRECOGNIZED_ATP_PROOF ())
   473                               (Scan.repeat1 (parse_line problem spass_names))))
   474        |> fst
   475 
   476 (** SPASS's FLOTTER hack **)
   477 
   478 (* This is a hack required for keeping track of facts after they have been
   479    clausified by SPASS's FLOTTER preprocessor. The "ATP/scripts/spass" script is
   480    also part of this hack. *)
   481 
   482 val set_ClauseFormulaRelationN = "set_ClauseFormulaRelation"
   483 
   484 fun extract_clause_sequence output =
   485   let
   486     val tokens_of = String.tokens (not o Char.isAlphaNum)
   487     fun extract_num ("clause" :: (ss as _ :: _)) = Int.fromString (List.last ss)
   488       | extract_num _ = NONE
   489   in output |> split_lines |> map_filter (extract_num o tokens_of) end
   490 
   491 fun is_head_digit s = Char.isDigit (String.sub (s, 0))
   492 val scan_integer = Scan.many1 is_head_digit >> (the o Int.fromString o implode)
   493 
   494 val parse_clause_formula_pair =
   495   $$ "(" |-- scan_integer --| $$ ","
   496   -- (Symbol.scan_id ::: Scan.repeat ($$ "," |-- Symbol.scan_id)) --| $$ ")"
   497   --| Scan.option ($$ ",")
   498 val parse_clause_formula_relation =
   499   Scan.this_string set_ClauseFormulaRelationN |-- $$ "("
   500   |-- Scan.repeat parse_clause_formula_pair
   501 val extract_clause_formula_relation =
   502   Substring.full #> Substring.position set_ClauseFormulaRelationN
   503   #> snd #> Substring.position "." #> fst #> Substring.string
   504   #> raw_explode #> filter_out Symbol.is_blank #> parse_clause_formula_relation
   505   #> fst
   506 
   507 fun extract_spass_name_vector output =
   508   (if String.isSubstring set_ClauseFormulaRelationN output then
   509      let
   510        val num_seq = extract_clause_sequence output
   511        val name_map = extract_clause_formula_relation output
   512        val name_seq = num_seq |> map (these o AList.lookup (op =) name_map)
   513      in name_seq end
   514    else
   515      [])
   516   |> Vector.fromList
   517 
   518 fun atp_proof_from_tstplike_proof _ _ "" = []
   519   | atp_proof_from_tstplike_proof problem output tstp =
   520     tstp ^ "$" (* the $ sign acts as a sentinel (FIXME: needed?) *)
   521     |> parse_proof problem (extract_spass_name_vector output)
   522     |> sort (step_name_ord o pairself step_name)
   523 
   524 fun clean_up_dependencies _ [] = []
   525   | clean_up_dependencies seen ((step as Definition (name, _, _)) :: steps) =
   526     step :: clean_up_dependencies (name :: seen) steps
   527   | clean_up_dependencies seen (Inference (name, u, rule, deps) :: steps) =
   528     Inference (name, u, rule,
   529                map_filter (fn dep => find_first (is_same_atp_step dep) seen)
   530                           deps) ::
   531     clean_up_dependencies (name :: seen) steps
   532 
   533 fun clean_up_atp_proof_dependencies proof = clean_up_dependencies [] proof
   534 
   535 fun map_term_names_in_term f (ATerm (s, ts)) =
   536   ATerm (f s, map (map_term_names_in_term f) ts)
   537 fun map_term_names_in_formula f (AQuant (q, xs, phi)) =
   538     AQuant (q, xs, map_term_names_in_formula f phi)
   539   | map_term_names_in_formula f (AConn (c, phis)) =
   540     AConn (c, map (map_term_names_in_formula f) phis)
   541   | map_term_names_in_formula f (AAtom t) = AAtom (map_term_names_in_term f t)
   542 fun map_term_names_in_step f (Definition (name, phi1, phi2)) =
   543     Definition (name, map_term_names_in_formula f phi1,
   544                 map_term_names_in_formula f phi2)
   545   | map_term_names_in_step f (Inference (name, phi, rule, deps)) =
   546     Inference (name, map_term_names_in_formula f phi, rule, deps)
   547 fun map_term_names_in_atp_proof f = map (map_term_names_in_step f)
   548 
   549 fun nasty_name pool s = s |> Symtab.lookup pool |> the_default s
   550 fun nasty_atp_proof pool =
   551   if Symtab.is_empty pool then I
   552   else map_term_names_in_atp_proof (nasty_name pool)
   553 
   554 end;