wneuper/isa: doc-src/Sledgehammer/sledgehammer.tex@d7447b8c4265 (annotated)

blanchet@36918	1	\documentclass[a4paper,12pt]{article}
blanchet@36918	2	\usepackage[T1]{fontenc}
blanchet@36918	3	\usepackage{amsmath}
blanchet@36918	4	\usepackage{amssymb}
blanchet@36918	5	\usepackage[english,french]{babel}
blanchet@36918	6	\usepackage{color}
blanchet@36918	7	\usepackage{footmisc}
blanchet@36918	8	\usepackage{graphicx}
blanchet@36918	9	%\usepackage{mathpazo}
blanchet@36918	10	\usepackage{multicol}
blanchet@36918	11	\usepackage{stmaryrd}
blanchet@36918	12	%\usepackage[scaled=.85]{beramono}
wenzelm@43382	13	\usepackage{../../lib/texinputs/isabelle,../iman,../pdfsetup}
blanchet@36918	14
blanchet@36918	15	%\oddsidemargin=4.6mm
blanchet@36918	16	%\evensidemargin=4.6mm
blanchet@36918	17	%\textwidth=150mm
blanchet@36918	18	%\topmargin=4.6mm
blanchet@36918	19	%\headheight=0mm
blanchet@36918	20	%\headsep=0mm
blanchet@36918	21	%\textheight=234mm
blanchet@36918	22
blanchet@36918	23	\def\Colon{\mathord{:\mkern-1.5mu:}}
blanchet@36918	24	%\def\lbrakk{\mathopen{\lbrack\mkern-3.25mu\lbrack}}
blanchet@36918	25	%\def\rbrakk{\mathclose{\rbrack\mkern-3.255mu\rbrack}}
blanchet@36918	26	\def\lparr{\mathopen{(\mkern-4mu\mid}}
blanchet@36918	27	\def\rparr{\mathclose{\mid\mkern-4mu)}}
blanchet@36918	28
blanchet@36918	29	\def\unk{{?}}
blanchet@36918	30	\def\undef{(\lambda x.\; \unk)}
blanchet@36918	31	%\def\unr{\textit{others}}
blanchet@36918	32	\def\unr{\ldots}
blanchet@36918	33	\def\Abs#1{\hbox{\rm{\flqq}}{\,#1\,}\hbox{\rm{\frqq}}}
blanchet@36918	34	\def\Q{{\smash{\lower.2ex\hbox{$\scriptstyle?$}}}}
blanchet@36918	35
blanchet@36918	36	\urlstyle{tt}
blanchet@36918	37
blanchet@36918	38	\begin{document}
blanchet@36918	39
blanchet@36918	40	\selectlanguage{english}
blanchet@36918	41
blanchet@36918	42	\title{\includegraphics[scale=0.5]{isabelle_sledgehammer} \\[4ex]
blanchet@36918	43	Hammering Away \\[\smallskipamount]
blanchet@36918	44	\Large A User's Guide to Sledgehammer for Isabelle/HOL}
blanchet@36918	45	\author{\hbox{} \\
blanchet@36918	46	Jasmin Christian Blanchette \\
blanchet@36918	47	{\normalsize Institut f\"ur Informatik, Technische Universit\"at M\"unchen} \\
blanchet@36918	48	\hbox{}}
blanchet@36918	49
blanchet@36918	50	\maketitle
blanchet@36918	51
blanchet@36918	52	\tableofcontents
blanchet@36918	53
blanchet@36918	54	\setlength{\parskip}{.7em plus .2em minus .1em}
blanchet@36918	55	\setlength{\parindent}{0pt}
blanchet@36918	56	\setlength{\abovedisplayskip}{\parskip}
blanchet@36918	57	\setlength{\abovedisplayshortskip}{.9\parskip}
blanchet@36918	58	\setlength{\belowdisplayskip}{\parskip}
blanchet@36918	59	\setlength{\belowdisplayshortskip}{.9\parskip}
blanchet@36918	60
blanchet@36918	61	% General-purpose enum environment with correct spacing
blanchet@36918	62	\newenvironment{enum}%
blanchet@36918	63	{\begin{list}{}{%
blanchet@36918	64	\setlength{\topsep}{.1\parskip}%
blanchet@36918	65	\setlength{\partopsep}{.1\parskip}%
blanchet@36918	66	\setlength{\itemsep}{\parskip}%
blanchet@36918	67	\advance\itemsep by-\parsep}}
blanchet@36918	68	{\end{list}}
blanchet@36918	69
blanchet@36918	70	\def\pre{\begingroup\vskip0pt plus1ex\advance\leftskip by\leftmargin
blanchet@36918	71	\advance\rightskip by\leftmargin}
blanchet@36918	72	\def\post{\vskip0pt plus1ex\endgroup}
blanchet@36918	73
blanchet@36918	74	\def\prew{\pre\advance\rightskip by-\leftmargin}
blanchet@36918	75	\def\postw{\post}
blanchet@36918	76
blanchet@36918	77	\section{Introduction}
blanchet@36918	78	\label{introduction}
blanchet@36918	79
blanchet@36918	80	Sledgehammer is a tool that applies first-order automatic theorem provers (ATPs)
blanchet@41190	81	and satisfiability-modulo-theories (SMT) solvers on the current goal. The
blanchet@40254	82	supported ATPs are E \cite{schulz-2002}, SPASS \cite{weidenbach-et-al-2009},
blanchet@43628	83	Vampire \cite{riazanov-voronkov-2002}, SInE-E \cite{sine}, SNARK
blanchet@43628	84	\cite{snark}, and ToFoF-E \cite{tofof}. The ATPs are run either locally or
blanchet@43628	85	remotely via the System\-On\-TPTP web service \cite{sutcliffe-2000}. In addition
blanchet@43628	86	to the ATPs, the SMT solver Z3 \cite{z3} is used by default, and you can tell
blanchet@43628	87	Sledgehammer to try Yices \cite{yices} and CVC3 \cite{cvc3} as well; these
blanchet@43628	88	are run either locally or on a server in Munich.
blanchet@36918	89
blanchet@40254	90	The problem passed to the automatic provers consists of your current goal
blanchet@40254	91	together with a heuristic selection of hundreds of facts (theorems) from the
blanchet@40254	92	current theory context, filtered by relevance. Because jobs are run in the
blanchet@40254	93	background, you can continue to work on your proof by other means. Provers can
blanchet@40254	94	be run in parallel. Any reply (which may arrive half a minute later) will appear
blanchet@40254	95	in the Proof General response buffer.
blanchet@37517	96
blanchet@40254	97	The result of a successful proof search is some source text that usually (but
blanchet@40254	98	not always) reconstructs the proof within Isabelle. For ATPs, the reconstructed
blanchet@40254	99	proof relies on the general-purpose Metis prover \cite{metis}, which is fully
blanchet@40254	100	integrated into Isabelle/HOL, with explicit inferences going through the kernel.
blanchet@40254	101	Thus its results are correct by construction.
blanchet@36918	102
blanchet@39566	103	In this manual, we will explicitly invoke the \textbf{sledgehammer} command.
blanchet@39566	104	Sledgehammer also provides an automatic mode that can be enabled via the
blanchet@39566	105	``Auto Sledgehammer'' option from the ``Isabelle'' menu in Proof General. In
blanchet@39566	106	this mode, Sledgehammer is run on every newly entered theorem. The time limit
blanchet@39566	107	for Auto Sledgehammer and other automatic tools can be set using the ``Auto
blanchet@39566	108	Tools Time Limit'' option.
blanchet@39566	109
blanchet@36918	110	\newbox\boxA
blanchet@36918	111	\setbox\boxA=\hbox{\texttt{nospam}}
blanchet@36918	112
blanchet@43628	113	\newcommand\authoremail{\texttt{blan{\color{white}nospam}\kern-\wd\boxA{}chette@\allowbreak
blanchet@43628	114	in.\allowbreak tum.\allowbreak de}}
blanchet@43628	115
blanchet@40937	116	To run Sledgehammer, you must make sure that the theory \textit{Sledgehammer} is
blanchet@40937	117	imported---this is rarely a problem in practice since it is part of
blanchet@40937	118	\textit{Main}. Examples of Sledgehammer use can be found in Isabelle's
blanchet@36918	119	\texttt{src/HOL/Metis\_Examples} directory.
blanchet@36918	120	Comments and bug reports concerning Sledgehammer or this manual should be
blanchet@43628	121	directed to \authoremail.
blanchet@36918	122
blanchet@36918	123	\vskip2.5\smallskipamount
blanchet@36918	124
blanchet@36918	125	%\textbf{Acknowledgment.} The author would like to thank Mark Summerfield for
blanchet@36918	126	%suggesting several textual improvements.
blanchet@36918	127
blanchet@36918	128	\section{Installation}
blanchet@36918	129	\label{installation}
blanchet@36918	130
blanchet@36918	131	Sledgehammer is part of Isabelle, so you don't need to install it. However, it
blanchet@43628	132	relies on third-party automatic theorem provers (ATPs) and SMT solvers.
blanchet@43628	133
blanchet@43628	134	\subsection{Installing ATPs}
blanchet@43628	135
blanchet@40254	136	Currently, E, SPASS, and Vampire can be run locally; in addition, E, Vampire,
blanchet@43628	137	SInE-E, SNARK, and ToFoF-E are available remotely via System\-On\-TPTP
blanchet@43628	138	\cite{sutcliffe-2000}. If you want better performance, you should at least
blanchet@43628	139	install E and SPASS locally.
blanchet@36918	140
blanchet@38289	141	There are three main ways to install ATPs on your machine:
blanchet@36918	142
blanchet@36918	143	\begin{enum}
blanchet@36918	144	\item[$\bullet$] If you installed an official Isabelle package with everything
blanchet@36918	145	inside, it should already include properly set up executables for E and SPASS,
blanchet@38289	146	ready to use.%
blanchet@38289	147	\footnote{Vampire's license prevents us from doing the same for this otherwise
blanchet@38289	148	wonderful tool.}
blanchet@36918	149
blanchet@38289	150	\item[$\bullet$] Alternatively, you can download the Isabelle-aware E and SPASS
blanchet@36918	151	binary packages from Isabelle's download page. Extract the archives, then add a
blanchet@42618	152	line to your \texttt{\$ISABELLE\_HOME\_USER/etc/components}%
blanchet@42618	153	\footnote{The variable \texttt{\$ISABELLE\_HOME\_USER} is set by Isabelle at
blanchet@42618	154	startup. Its value can be retrieved by invoking \texttt{isabelle}
blanchet@42618	155	\texttt{getenv} \texttt{ISABELLE\_HOME\_USER} on the command line.}
blanchet@42618	156	file with the absolute
blanchet@40444	157	path to E or SPASS. For example, if the \texttt{components} file does not exist yet
blanchet@40444	158	and you extracted SPASS to \texttt{/usr/local/spass-3.7}, create the
blanchet@40444	159	\texttt{components} file with the single line
blanchet@36918	160
blanchet@36918	161	\prew
blanchet@36918	162	\texttt{/usr/local/spass-3.7}
blanchet@36918	163	\postw
blanchet@36918	164
blanchet@38289	165	in it.
blanchet@38289	166
blanchet@38289	167	\item[$\bullet$] If you prefer to build E or SPASS yourself, or obtained a
blanchet@38289	168	Vampire executable from somewhere (e.g., \url{http://www.vprover.org/}),
blanchet@38289	169	set the environment variable \texttt{E\_HOME}, \texttt{SPASS\_HOME}, or
blanchet@38289	170	\texttt{VAMPIRE\_HOME} to the directory that contains the \texttt{eproof},
blanchet@38309	171	\texttt{SPASS}, or \texttt{vampire} executable. Sledgehammer has been tested
blanchet@43714	172	with E 1.0 and 1.2, SPASS 3.5 and 3.7, and Vampire 0.6 and 1.0%
blanchet@38309	173	\footnote{Following the rewrite of Vampire, the counter for version numbers was
blanchet@43714	174	reset to 0; hence the (new) Vampire versions 0.6 and 1.0 are more recent than,
blanchet@43714	175	say, Vampire 11.5.}%
blanchet@38309	176	. Since the ATPs' output formats are neither documented nor stable, other
blanchet@43628	177	versions of the ATPs might or might not work well with Sledgehammer. Ideally,
blanchet@43628	178	also set \texttt{E\_VERSION}, \texttt{SPASS\_VERSION}, or
blanchet@43628	179	\texttt{VAMPIRE\_VERSION} to the ATP's version number (e.g., ``1.2'').
blanchet@36918	180	\end{enum}
blanchet@36918	181
blanchet@43628	182	To check whether E and SPASS are successfully installed, follow the example in
blanchet@43628	183	\S\ref{first-steps}. If the remote versions of E and SPASS are used (identified
blanchet@43628	184	by the prefix ``\emph{remote\_}''), or if the local versions fail to solve the
blanchet@43628	185	easy goal presented there, this is a sign that something is wrong with your
blanchet@43628	186	installation.
blanchet@36918	187
blanchet@37517	188	Remote ATP invocation via the System\-On\-TPTP web service requires Perl with the
blanchet@39388	189	World Wide Web Library (\texttt{libwww-perl}) installed. If you must use a proxy
blanchet@39388	190	server to access the Internet, set the \texttt{http\_proxy} environment variable
blanchet@39389	191	to the proxy, either in the environment in which Isabelle is launched or in your
blanchet@42618	192	\texttt{\$ISABELLE\_HOME\_USER/etc/settings} file. Here are a few examples:
blanchet@39388	193
blanchet@39388	194	\prew
blanchet@39389	195	\texttt{http\_proxy=http://proxy.example.org} \\
blanchet@39389	196	\texttt{http\_proxy=http://proxy.example.org:8080} \\
blanchet@39389	197	\texttt{http\_proxy=http://joeblow:pAsSwRd@proxy.example.org}
blanchet@39388	198	\postw
blanchet@37517	199
blanchet@43628	200	\subsection{Installing SMT Solvers}
blanchet@43628	201
blanchet@43628	202	CVC3, Yices, and Z3 can be run locally or remotely on a Munich server. If you
blanchet@43628	203	want better performance and the ability to replay proofs that rely on the
blanchet@43628	204	\emph{smt} proof method, you should at least install Z3 locally.
blanchet@43628	205
blanchet@43628	206	There are two main ways of installing SMT solvers locally.
blanchet@43628	207
blanchet@43628	208	\begin{enum}
blanchet@43628	209	\item[$\bullet$] If you installed an official Isabelle package with everything
blanchet@43628	210	inside, it should already include properly set up executables for CVC3 and Z3,
blanchet@43628	211	ready to use.%
blanchet@43628	212	\footnote{Yices's license prevents us from doing the same for this otherwise
blanchet@43628	213	wonderful tool.}
blanchet@43628	214	For Z3, you additionally need to set the environment variable
blanchet@43628	215	\texttt{Z3\_NON\_COMMERCIAL} to ``yes'' to confirm that you are a noncommercial
blanchet@43628	216	user.
blanchet@43628	217
blanchet@43628	218	\item[$\bullet$] Otherwise, follow the instructions documented in the \emph{SMT}
blanchet@43628	219	theory (\texttt{\$ISABELLE\_HOME/src/HOL/SMT.thy}).
blanchet@43628	220	\end{enum}
blanchet@43628	221
blanchet@36918	222	\section{First Steps}
blanchet@36918	223	\label{first-steps}
blanchet@36918	224
blanchet@36918	225	To illustrate Sledgehammer in context, let us start a theory file and
blanchet@36918	226	attempt to prove a simple lemma:
blanchet@36918	227
blanchet@36918	228	\prew
blanchet@36918	229	\textbf{theory}~\textit{Scratch} \\
blanchet@36918	230	\textbf{imports}~\textit{Main} \\
blanchet@36918	231	\textbf{begin} \\[2\smallskipamount]
blanchet@36918	232	%
blanchet@36918	233	\textbf{lemma} ``$[a] = [b] \,\longleftrightarrow\, a = b$'' \\
blanchet@36918	234	\textbf{sledgehammer}
blanchet@36918	235	\postw
blanchet@36918	236
blanchet@37517	237	Instead of issuing the \textbf{sledgehammer} command, you can also find
blanchet@37517	238	Sledgehammer in the ``Commands'' submenu of the ``Isabelle'' menu in Proof
blanchet@37517	239	General or press the Emacs key sequence C-c C-a C-s.
blanchet@37517	240	Either way, Sledgehammer produces the following output after a few seconds:
blanchet@36918	241
blanchet@36918	242	\prew
blanchet@36918	243	\slshape
blanchet@40241	244	Sledgehammer: ``\textit{e}'' for subgoal 1: \\
blanchet@36918	245	$([a] = [b]) = (a = b)$ \\
blanchet@36918	246	Try this command: \textbf{by} (\textit{metis hd.simps}). \\
blanchet@38289	247	To minimize the number of lemmas, try this: \\
blanchet@40240	248	\textbf{sledgehammer} \textit{minimize} [\textit{prover} = \textit{e}] (\textit{hd.simps}). \\[3\smallskipamount]
blanchet@36918	249	%
blanchet@40241	250	Sledgehammer: ``\textit{spass}'' for subgoal 1: \\
blanchet@36918	251	$([a] = [b]) = (a = b)$ \\
blanchet@36918	252	Try this command: \textbf{by} (\textit{metis insert\_Nil last\_ConsL}). \\
blanchet@38289	253	To minimize the number of lemmas, try this: \\
blanchet@40240	254	\textbf{sledgehammer} \textit{minimize} [\textit{prover} = \textit{spass}] (\textit{insert\_Nil last\_ConsL}). \\[3\smallskipamount]
blanchet@36918	255	%
blanchet@40254	256	Sledgehammer: ``\textit{vampire}'' for subgoal 1: \\
blanchet@36918	257	$([a] = [b]) = (a = b)$ \\
blanchet@43715	258	Try this command: \textbf{by} (\textit{metis eq\_commute last\_snoc}). \\
blanchet@38289	259	To minimize the number of lemmas, try this: \\
blanchet@40254	260	\textbf{sledgehammer} \textit{minimize} [\textit{prover} = \textit{vampire}]~(\textit{eq\_commute last\_snoc}). \\[3\smallskipamount]
blanchet@40254	261	%
blanchet@40254	262	Sledgehammer: ``\textit{remote\_sine\_e}'' for subgoal 1: \\
blanchet@40254	263	$([a] = [b]) = (a = b)$ \\
blanchet@43715	264	Try this command: \textbf{by} (\textit{metis hd.simps}). \\
blanchet@40254	265	To minimize the number of lemmas, try this: \\
blanchet@43715	266	\textbf{sledgehammer} \textit{minimize} [\textit{prover} = \textit{remote\_sine\_e}]~(\textit{hd.simps}). \\[3\smallskipamount]
blanchet@41190	267	%
blanchet@41190	268	Sledgehammer: ``\textit{remote\_z3}'' for subgoal 1: \\
blanchet@41190	269	$([a] = [b]) = (a = b)$ \\
blanchet@43715	270	Try this command: \textbf{by} (\textit{metis hd.simps}). \\
blanchet@41190	271	To minimize the number of lemmas, try this: \\
blanchet@41190	272	\textbf{sledgehammer} \textit{minimize} [\textit{prover} = \textit{remote\_z3}]~(\textit{hd.simps}).
blanchet@36918	273	\postw
blanchet@36918	274
blanchet@41190	275	Sledgehammer ran E, SPASS, Vampire, SInE-E, and Z3 in parallel. Depending on
blanchet@41190	276	which provers are installed and how many processor cores are available, some of
blanchet@41190	277	the provers might be missing or present with a \textit{remote\_} prefix.
blanchet@36918	278
blanchet@40254	279	For each successful prover, Sledgehammer gives a one-liner proof that uses the
blanchet@40254	280	\textit{metis} or \textit{smt} method. You can click the proof to insert it into
blanchet@40254	281	the theory text. You can click the ``\textbf{sledgehammer} \textit{minimize}''
blanchet@40254	282	command if you want to look for a shorter (and probably faster) proof. But here
blanchet@40254	283	the proof found by E looks perfect, so click it to finish the proof.
blanchet@36918	284
blanchet@36918	285	You can ask Sledgehammer for an Isar text proof by passing the
blanchet@36918	286	\textit{isar\_proof} option:
blanchet@36918	287
blanchet@36918	288	\prew
blanchet@36918	289	\textbf{sledgehammer} [\textit{isar\_proof}]
blanchet@36918	290	\postw
blanchet@36918	291
blanchet@36918	292	When Isar proof construction is successful, it can yield proofs that are more
blanchet@36918	293	readable and also faster than the \textit{metis} one-liners. This feature is
blanchet@40254	294	experimental and is only available for ATPs.
blanchet@36918	295
blanchet@37517	296	\section{Hints}
blanchet@37517	297	\label{hints}
blanchet@37517	298
blanchet@43628	299	\newcommand\point[1]{{\sl\bfseries#1}\par\nopagebreak}
blanchet@43628	300
blanchet@43628	301	\point{Presimplify the goal}
blanchet@43628	302
blanchet@37517	303	For best results, first simplify your problem by calling \textit{auto} or at
blanchet@37517	304	least \textit{safe} followed by \textit{simp\_all}. None of the ATPs contain
blanchet@37517	305	arithmetic decision procedures. They are not especially good at heavy rewriting,
blanchet@37517	306	but because they regard equations as undirected, they often prove theorems that
blanchet@37517	307	require the reverse orientation of a \textit{simp} rule. Higher-order problems
blanchet@37517	308	can be tackled, but the success rate is better for first-order problems. Hence,
blanchet@37517	309	you may get better results if you first simplify the problem to remove
blanchet@37517	310	higher-order features.
blanchet@37517	311
blanchet@43628	312	\point{Make sure at least E, SPASS, Vampire, and Z3 are installed}
blanchet@43628	313
blanchet@43628	314	Locally installed provers are faster and more reliable than those running on
blanchet@43628	315	servers. See \S\ref{installation} for details on how to install them.
blanchet@43628	316
blanchet@43628	317	\point{Familiarize yourself with the most important options}
blanchet@43628	318
blanchet@43628	319	Sledgehammer's options are fully documented in \S\ref{command-syntax}. Many of
blanchet@43628	320	the options are very specialized, but serious users of the tool should at least
blanchet@43628	321	familiarize themselves with the following options:
blanchet@43628	322
blanchet@43628	323	\begin{enum}
blanchet@43628	324	\item[$\bullet$] \textbf{\textit{provers}} specifies the ATP and SMT solvers to
blanchet@43628	325	use (e.g., ``\textit{provers} = \textit{e spass remote\_vampire}'').
blanchet@43628	326
blanchet@43719	327	\item[$\bullet$] \textbf{\textit{timeout}} controls the provers' time limit. It
blanchet@43719	328	is set to 30 seconds, but since Sledgehammer runs asynchronously you should not
blanchet@43719	329	hesitate to raise this limit to 60 or 120 seconds if you are the kind of user
blanchet@43719	330	who can think clearly while ATPs are active.
blanchet@43628	331
blanchet@43628	332	\item[$\bullet$] \textbf{\textit{full\_types}} specifies whether type-sound
blanchet@43628	333	encodings should be used. By default, Sledgehammer employs a mixture of
blanchet@43628	334	type-sound and type-unsound encodings, occasionally yielding unsound ATP proofs.
blanchet@43628	335	(SMT solver proofs should always be sound, although we occasionally find
blanchet@43628	336	soundness bugs in the solvers.)
blanchet@43628	337
blanchet@43628	338	\item[$\bullet$] \textbf{\textit{max\_relevant}} specifies the maximum number of
blanchet@43628	339	facts that should be passed to the provers. By default, the value is
blanchet@43628	340	prover-dependent but varies between about 150 and 1000. If the provers time out,
blanchet@43628	341	you can try lowering this value to, say, 100 or 50 and see if that helps.
blanchet@43628	342
blanchet@43628	343	\item[$\bullet$] \textbf{\textit{isar\_proof}} specifies that Isar proofs should
blanchet@43628	344	be generated, instead of one-liner Metis proofs. The length of the Isar proofs
blanchet@43628	345	can be controlled by setting \textit{isar\_shrink\_factor}.
blanchet@43628	346	\end{enum}
blanchet@43628	347
blanchet@43628	348	Options can be set globally using \textbf{sledgehammer\_params}. Fact selection
blanchet@43628	349	can be influenced by specifying ``$(\textit{add}{:}~\textit{some\_facts})$'' after
blanchet@43628	350	the \textbf{sledgehammer} call to ensure that certain facts are included, or
blanchet@43628	351	simply ``$(\textit{some\_facts})$'' to force Sledgehammer to run only with
blanchet@43628	352	$\textit{some\_facts}$.
blanchet@43628	353
blanchet@43628	354	\section{Frequently Asked Questions}
blanchet@43628	355	\label{frequently-asked-questions}
blanchet@43628	356
blanchet@43628	357	\point{Why does Metis fail to reconstruct the proof?}
blanchet@43628	358
blanchet@43628	359	There can be many reasons. If Metis runs seemingly forever, that's a sign that
blanchet@43628	360	the proof is too difficult for it. Metis is complete, so it should eventually
blanchet@43628	361	find it, but that's little consolation. There are several possible solutions:
blanchet@43628	362
blanchet@43628	363	\begin{enum}
blanchet@43628	364	\item[$\bullet$] Try the \textit{isar\_proof} option to obtain a step-by-step
blanchet@43628	365	Isar proof where each step is justified by Metis. Since the steps are fairly
blanchet@43628	366	small, Metis is more likely to be able to replay them.
blanchet@43628	367
blanchet@43628	368	\item[$\bullet$] Try the \textit{smt} proof method instead of \textit{metis}. It
blanchet@43628	369	is usually stronger, but you need to have Z3 available to replay the proofs,
blanchet@43628	370	trust the SMT solver, or use certificates. See the documentation in the
blanchet@43628	371	\emph{SMT} theory (\texttt{\$ISABELLE\_HOME/src/HOL/SMT.thy}) for details.
blanchet@43628	372
blanchet@43628	373	\item[$\bullet$] Try the \textit{blast} or \textit{auto} proof methods, passing
blanchet@43628	374	facts via \textbf{unfolding}, \textbf{using}, \textit{intro}{:},
blanchet@43628	375	\textit{elim}{:}, \textit{dest}{:}, or \textit{simp}{:}, as appropriate.
blanchet@43628	376	\end{enum}
blanchet@43628	377
blanchet@43628	378	% * sometimes Metis runs into some error, e.g. a type error. then it tries
blanchet@43628	379	% again with metisFT, where FT stands for ``full type information''
blanchet@43628	380	% * metisFT is much slower, but its proof search is fully typed, and it also
blanchet@43628	381	% includes more powerful rules such as the axiom ``$x = \mathit{True}
blanchet@43628	382	% \mathrel{\lor} x = \mathit{False}$'' for reasoning in higher-order places
blanchet@43628	383	% (e.g., in set comprehensions)
blanchet@43628	384	%
blanchet@43628	385	% * finally, in some cases the ATP proof is simply type-incorrect.
blanchet@43628	386	% Sledgehammer drops some type information to speed up the search. Try
blanchet@43628	387	% Sledgehammer again with full type information: \textit{full\_types}
blanchet@43628	388	% (\S\ref{problem-encoding}), or choose a specific type encoding with
blanchet@43628	389	% \textit{type\_sys} (\S\ref{problem-encoding}). Older versions of
blanchet@43628	390	% Sledgehammer were frequent victims of this problem. Now this should very
blanchet@43628	391	% seldom be an issue, but if you notice too many unsound proofs, contact
blanchet@43628	392	%
blanchet@43628	393	%\point{How can I easily tell whether a Sledgehammer proof is sound?}
blanchet@43628	394	%
blanchet@43628	395	%Easiest way: Once it's found: ... by (metis facts)
blanchet@43628	396	%try
blanchet@43628	397	%sledgehammer [full\_types] (facts)
blanchet@43628	398	%
blanchet@43628	399	%should usually give unprovable or refind the proof fairly quickly
blanchet@43628	400	%
blanchet@43628	401	%Same trick if you believe that there exists a proof with certain facts.
blanchet@43628	402	%
blanchet@43628	403	%\point{Which facts does Sledgehammer select?}
blanchet@43628	404	%
blanchet@43628	405	% * heuristic
blanchet@43628	406	% * and several hundreds
blanchet@43628	407	% * show them: debug
blanchet@43628	408	% * influence it with sledgehammer (add: xxx)
blanchet@43628	409	%
blanchet@43628	410	% * S/h good at finding short proofs combining a handful of existing lemmas
blanchet@43628	411	% * for deeper proofs, you must restrict the number of facts, e.g.
blanchet@43628	412	% max\_relevant = 50
blanchet@43628	413	% * but then proof reconstruction is an issue
blanchet@43628	414	%
blanchet@43628	415	%\point{Why are the Isar proofs generated by Sledgehammer so ugly?}
blanchet@43628	416	%
blanchet@43628	417	% * experimental
blanchet@43628	418	% * working on this
blanchet@43628	419	% * there is a large body of research into transforming resolution proofs into
blanchet@43628	420	% natural deduction proofs (e.g., Isar proofs)
blanchet@43628	421	% * meantime: isar\_shrink\_factor
blanchet@43628	422	%
blanchet@43628	423	%
blanchet@43628	424	%\point{Should I let Sledgehammer minimize the number of lemmas?}
blanchet@43628	425	%
blanchet@43628	426	% * in general, yes
blanchet@43628	427	% * proofs involving fewer lemmas tend to be shorter as well, and hence easier
blanchet@43628	428	% to re-find by Metis
blanchet@43628	429	% * but the opposite is sometimes the case
blanchet@43628	430
blanchet@43719	431	% Why is Sledgehammer automatically minimizing sometimes?
blanchet@43719	432	% * some provers (e.g. CVC3 and Yices)
blanchet@43719	433	% * also, sometimes E finds a proof but doesn't give a proof object
blanchet@43719	434
blanchet@43628	435	\point{I got a strange error from Sledgehammer---what should I do?}
blanchet@43628	436
blanchet@43628	437	Sledgehammer tries to give informative error messages. Please report any strange
blanchet@43628	438	error to \authoremail. This applies doubly if you get the message
blanchet@43628	439
blanchet@43628	440	\begin{quote}
blanchet@43628	441	\slshape
blanchet@43746	442	The prover found a type-unsound proof involving ``\textit{foo}'',
blanchet@43746	443	``\textit{bar}'', ``\textit{baz}'' even though a supposedly type-sound encoding
blanchet@43746	444	was used (or, less likely, your axioms are inconsistent). You might want to
blanchet@43746	445	report this to the Isabelle developers.
blanchet@43628	446	\end{quote}
blanchet@43628	447
blanchet@43628	448	\point{Auto can solve it---why not Sledgehammer?}
blanchet@43628	449
blanchet@43628	450	Problems can be easy for \textit{auto} and difficult for automatic provers, but
blanchet@43628	451	the reverse is also true, so don't be discouraged if your first attempts fail.
blanchet@39566	452	Because the system refers to all theorems known to Isabelle, it is particularly
blanchet@39566	453	suitable when your goal has a short proof from lemmas that you don't know about.
blanchet@37517	454
blanchet@36918	455	\section{Command Syntax}
blanchet@36918	456	\label{command-syntax}
blanchet@36918	457
blanchet@36918	458	Sledgehammer can be invoked at any point when there is an open goal by entering
blanchet@36918	459	the \textbf{sledgehammer} command in the theory file. Its general syntax is as
blanchet@36918	460	follows:
blanchet@36918	461
blanchet@36918	462	\prew
blanchet@36918	463	\textbf{sledgehammer} \textit{subcommand\/$^?$ options\/$^?$ facts\_override\/$^?$ num\/$^?$}
blanchet@36918	464	\postw
blanchet@36918	465
blanchet@36918	466	For convenience, Sledgehammer is also available in the ``Commands'' submenu of
blanchet@36918	467	the ``Isabelle'' menu in Proof General or by pressing the Emacs key sequence C-c
blanchet@36918	468	C-a C-s. This is equivalent to entering the \textbf{sledgehammer} command with
blanchet@36918	469	no arguments in the theory text.
blanchet@36918	470
blanchet@36918	471	In the general syntax, the \textit{subcommand} may be any of the following:
blanchet@36918	472
blanchet@36918	473	\begin{enum}
blanchet@40444	474	\item[$\bullet$] \textbf{\textit{run} (the default):} Runs Sledgehammer on
blanchet@40444	475	subgoal number \textit{num} (1 by default), with the given options and facts.
blanchet@36918	476
blanchet@36918	477	\item[$\bullet$] \textbf{\textit{minimize}:} Attempts to minimize the provided facts
blanchet@36918	478	(specified in the \textit{facts\_override} argument) to obtain a simpler proof
blanchet@36918	479	involving fewer facts. The options and goal number are as for \textit{run}.
blanchet@36918	480
blanchet@40444	481	\item[$\bullet$] \textbf{\textit{messages}:} Redisplays recent messages issued
blanchet@40444	482	by Sledgehammer. This allows you to examine results that might have been lost
blanchet@40444	483	due to Sledgehammer's asynchronous nature. The \textit{num} argument specifies a
blanchet@36918	484	limit on the number of messages to display (5 by default).
blanchet@36918	485
blanchet@42591	486	\item[$\bullet$] \textbf{\textit{supported\_provers}:} Prints the list of
blanchet@42588	487	automatic provers supported by Sledgehammer. See \S\ref{installation} and
blanchet@42588	488	\S\ref{mode-of-operation} for more information on how to install automatic
blanchet@42588	489	provers.
blanchet@36918	490
blanchet@40240	491	\item[$\bullet$] \textbf{\textit{running\_provers}:} Prints information about
blanchet@40240	492	currently running automatic provers, including elapsed runtime and remaining
blanchet@40240	493	time until timeout.
blanchet@36918	494
blanchet@40240	495	\item[$\bullet$] \textbf{\textit{kill\_provers}:} Terminates all running
blanchet@40240	496	automatic provers.
blanchet@36918	497
blanchet@36918	498	\item[$\bullet$] \textbf{\textit{refresh\_tptp}:} Refreshes the list of remote
blanchet@36918	499	ATPs available at System\-On\-TPTP \cite{sutcliffe-2000}.
blanchet@36918	500	\end{enum}
blanchet@36918	501
blanchet@36918	502	Sledgehammer's behavior can be influenced by various \textit{options}, which can
blanchet@36918	503	be specified in brackets after the \textbf{sledgehammer} command. The
blanchet@36918	504	\textit{options} are a list of key--value pairs of the form ``[$k_1 = v_1,
blanchet@36918	505	\ldots, k_n = v_n$]''. For Boolean options, ``= \textit{true}'' is optional. For
blanchet@36918	506	example:
blanchet@36918	507
blanchet@36918	508	\prew
blanchet@36918	509	\textbf{sledgehammer} [\textit{isar\_proof}, \,\textit{timeout} = 120$\,s$]
blanchet@36918	510	\postw
blanchet@36918	511
blanchet@36918	512	Default values can be set using \textbf{sledgehammer\_\allowbreak params}:
blanchet@36918	513
blanchet@36918	514	\prew
blanchet@36918	515	\textbf{sledgehammer\_params} \textit{options}
blanchet@36918	516	\postw
blanchet@36918	517
blanchet@36918	518	The supported options are described in \S\ref{option-reference}.
blanchet@36918	519
blanchet@36918	520	The \textit{facts\_override} argument lets you alter the set of facts that go
blanchet@36918	521	through the relevance filter. It may be of the form ``(\textit{facts})'', where
blanchet@36918	522	\textit{facts} is a space-separated list of Isabelle facts (theorems, local
blanchet@36918	523	assumptions, etc.), in which case the relevance filter is bypassed and the given
blanchet@39566	524	facts are used. It may also be of the form ``(\textit{add}:\ \textit{facts}$_1$)'',
blanchet@39566	525	``(\textit{del}:\ \textit{facts}$_2$)'', or ``(\textit{add}:\ \textit{facts}$_1$\
blanchet@39566	526	\textit{del}:\ \textit{facts}$_2$)'', where the relevance filter is instructed to
blanchet@36918	527	proceed as usual except that it should consider \textit{facts}$_1$
blanchet@36918	528	highly relevant and \textit{facts}$_2$ fully irrelevant.
blanchet@36918	529
blanchet@39566	530	You can instruct Sledgehammer to run automatically on newly entered theorems by
blanchet@39566	531	enabling the ``Auto Sledgehammer'' option from the ``Isabelle'' menu in Proof
blanchet@40240	532	General. For automatic runs, only the first prover set using \textit{provers}
blanchet@43601	533	(\S\ref{mode-of-operation}) is considered, fewer facts are passed to the prover,
blanchet@43601	534	\textit{slicing} (\S\ref{mode-of-operation}) is disabled, \textit{timeout}
blanchet@40254	535	(\S\ref{mode-of-operation}) is superseded by the ``Auto Tools Time Limit'' in
blanchet@43601	536	Proof General's ``Isabelle'' menu, \textit{full\_types}
blanchet@43601	537	(\S\ref{problem-encoding}) is enabled, and \textit{verbose}
blanchet@43601	538	(\S\ref{output-format}) and \textit{debug} (\S\ref{output-format}) are disabled.
blanchet@43601	539	Sledgehammer's output is also more concise.
blanchet@39566	540
blanchet@36918	541	\section{Option Reference}
blanchet@36918	542	\label{option-reference}
blanchet@36918	543
blanchet@36918	544	\def\flushitem#1{\item[]\noindent\kern-\leftmargin \textbf{#1}}
blanchet@36918	545	\def\qty#1{$\left<\textit{#1}\right>$}
blanchet@36918	546	\def\qtybf#1{$\mathbf{\left<\textbf{\textit{#1}}\right>}$}
blanchet@36918	547	\def\optrue#1#2{\flushitem{\textit{#1} $\bigl[$= \qtybf{bool}$\bigr]$\quad [\textit{true}]\hfill (neg.: \textit{#2})}\nopagebreak\\[\parskip]}
blanchet@36918	548	\def\opfalse#1#2{\flushitem{\textit{#1} $\bigl[$= \qtybf{bool}$\bigr]$\quad [\textit{false}]\hfill (neg.: \textit{#2})}\nopagebreak\\[\parskip]}
blanchet@36918	549	\def\opsmart#1#2{\flushitem{\textit{#1} $\bigl[$= \qtybf{bool\_or\_smart}$\bigr]$\quad [\textit{smart}]\hfill (neg.: \textit{#2})}\nopagebreak\\[\parskip]}
blanchet@36918	550	\def\opsmartx#1#2{\flushitem{\textit{#1} $\bigl[$= \qtybf{bool\_or\_smart}$\bigr]$\quad [\textit{smart}]\hfill\\\hbox{}\hfill (neg.: \textit{#2})}\nopagebreak\\[\parskip]}
blanchet@36918	551	\def\opnodefault#1#2{\flushitem{\textit{#1} = \qtybf{#2}} \nopagebreak\\[\parskip]}
blanchet@36918	552	\def\opdefault#1#2#3{\flushitem{\textit{#1} = \qtybf{#2}\quad [\textit{#3}]} \nopagebreak\\[\parskip]}
blanchet@36918	553	\def\oparg#1#2#3{\flushitem{\textit{#1} \qtybf{#2} = \qtybf{#3}} \nopagebreak\\[\parskip]}
blanchet@36918	554	\def\opargbool#1#2#3{\flushitem{\textit{#1} \qtybf{#2} $\bigl[$= \qtybf{bool}$\bigr]$\hfill (neg.: \textit{#3})}\nopagebreak\\[\parskip]}
blanchet@36918	555	\def\opargboolorsmart#1#2#3{\flushitem{\textit{#1} \qtybf{#2} $\bigl[$= \qtybf{bool\_or\_smart}$\bigr]$\hfill (neg.: \textit{#3})}\nopagebreak\\[\parskip]}
blanchet@36918	556
blanchet@36918	557	Sledgehammer's options are categorized as follows:\ mode of operation
blanchet@39228	558	(\S\ref{mode-of-operation}), problem encoding (\S\ref{problem-encoding}),
blanchet@39228	559	relevance filter (\S\ref{relevance-filter}), output format
blanchet@39228	560	(\S\ref{output-format}), and authentication (\S\ref{authentication}).
blanchet@36918	561
blanchet@36918	562	The descriptions below refer to the following syntactic quantities:
blanchet@36918	563
blanchet@36918	564	\begin{enum}
blanchet@36918	565	\item[$\bullet$] \qtybf{string}: A string.
blanchet@36918	566	\item[$\bullet$] \qtybf{bool\/}: \textit{true} or \textit{false}.
blanchet@40444	567	\item[$\bullet$] \qtybf{bool\_or\_smart\/}: \textit{true}, \textit{false}, or
blanchet@40444	568	\textit{smart}.
blanchet@36918	569	\item[$\bullet$] \qtybf{int\/}: An integer.
blanchet@43589	570	%\item[$\bullet$] \qtybf{float\/}: A floating-point number (e.g., 2.5).
blanchet@40584	571	\item[$\bullet$] \qtybf{float\_pair\/}: A pair of floating-point numbers
blanchet@40584	572	(e.g., 0.6 0.95).
blanchet@38814	573	\item[$\bullet$] \qtybf{int\_or\_smart\/}: An integer or \textit{smart}.
blanchet@40584	574	\item[$\bullet$] \qtybf{float\_or\_none\/}: An integer (e.g., 60) or
blanchet@40584	575	floating-point number (e.g., 0.5) expressing a number of seconds, or the keyword
blanchet@40584	576	\textit{none} ($\infty$ seconds).
blanchet@36918	577	\end{enum}
blanchet@36918	578
blanchet@36918	579	Default values are indicated in square brackets. Boolean options have a negated
blanchet@39228	580	counterpart (e.g., \textit{blocking} vs.\ \textit{non\_blocking}). When setting
blanchet@36918	581	Boolean options, ``= \textit{true}'' may be omitted.
blanchet@36918	582
blanchet@36918	583	\subsection{Mode of Operation}
blanchet@36918	584	\label{mode-of-operation}
blanchet@36918	585
blanchet@36918	586	\begin{enum}
blanchet@40240	587	\opnodefault{provers}{string}
blanchet@40240	588	Specifies the automatic provers to use as a space-separated list (e.g.,
blanchet@40240	589	``\textit{e}~\textit{spass}''). The following provers are supported:
blanchet@36918	590
blanchet@36918	591	\begin{enum}
blanchet@36918	592	\item[$\bullet$] \textbf{\textit{e}:} E is an ATP developed by Stephan Schulz
blanchet@36918	593	\cite{schulz-2002}. To use E, set the environment variable
blanchet@36918	594	\texttt{E\_HOME} to the directory that contains the \texttt{eproof} executable,
blanchet@36918	595	or install the prebuilt E package from Isabelle's download page. See
blanchet@36918	596	\S\ref{installation} for details.
blanchet@36918	597
blanchet@36918	598	\item[$\bullet$] \textbf{\textit{spass}:} SPASS is an ATP developed by Christoph
blanchet@36918	599	Weidenbach et al.\ \cite{weidenbach-et-al-2009}. To use SPASS, set the
blanchet@36918	600	environment variable \texttt{SPASS\_HOME} to the directory that contains the
blanchet@36918	601	\texttt{SPASS} executable, or install the prebuilt SPASS package from Isabelle's
blanchet@37389	602	download page. Sledgehammer requires version 3.5 or above. See
blanchet@37389	603	\S\ref{installation} for details.
blanchet@36918	604
blanchet@36918	605	\item[$\bullet$] \textbf{\textit{vampire}:} Vampire is an ATP developed by
blanchet@36918	606	Andrei Voronkov and his colleagues \cite{riazanov-voronkov-2002}. To use
blanchet@36918	607	Vampire, set the environment variable \texttt{VAMPIRE\_HOME} to the directory
blanchet@41190	608	that contains the \texttt{vampire} executable. Sledgehammer has been tested with
blanchet@41190	609	versions 11, 0.6, and 1.0.
blanchet@36918	610
blanchet@42611	611	\item[$\bullet$] \textbf{\textit{cvc3}:} CVC3 is an SMT solver developed by
blanchet@42611	612	Clark Barrett, Cesare Tinelli, and their colleagues \cite{cvc3}. To use CVC3,
blanchet@42611	613	set the environment variable \texttt{CVC3\_SOLVER} to the complete path of the
blanchet@42611	614	executable, including the file name. Sledgehammer has been tested with version
blanchet@42611	615	2.2.
blanchet@41190	616
blanchet@41190	617	\item[$\bullet$] \textbf{\textit{yices}:} Yices is an SMT solver developed at
blanchet@41190	618	SRI \cite{yices}. To use Yices, set the environment variable
blanchet@41190	619	\texttt{YICES\_SOLVER} to the complete path of the executable, including the
blanchet@41190	620	file name. Sledgehammer has been tested with version 1.0.
blanchet@41190	621
blanchet@42611	622	\item[$\bullet$] \textbf{\textit{z3}:} Z3 is an SMT solver developed at
blanchet@42611	623	Microsoft Research \cite{z3}. To use Z3, set the environment variable
blanchet@42611	624	\texttt{Z3\_SOLVER} to the complete path of the executable, including the file
blanchet@42611	625	name. Sledgehammer has been tested with versions 2.7 to 2.18.
blanchet@42611	626
blanchet@42611	627	\item[$\bullet$] \textbf{\textit{z3\_atp}:} This version of Z3 pretends to be an
blanchet@42611	628	ATP, exploiting Z3's undocumented support for the TPTP format. It is included
blanchet@43313	629	for experimental purposes. It requires version 2.18 or above.
blanchet@40254	630
blanchet@38824	631	\item[$\bullet$] \textbf{\textit{remote\_e}:} The remote version of E runs
blanchet@36918	632	on Geoff Sutcliffe's Miami servers \cite{sutcliffe-2000}.
blanchet@36918	633
blanchet@36918	634	\item[$\bullet$] \textbf{\textit{remote\_vampire}:} The remote version of
blanchet@38824	635	Vampire runs on Geoff Sutcliffe's Miami servers. Version 9 is used.
blanchet@36918	636
blanchet@43406	637	\item[$\bullet$] \textbf{\textit{remote\_tofof\_e}:} ToFoF-E is a metaprover
blanchet@43406	638	developed by Geoff Sutcliffe \cite{tofof} based on E running on his Miami
blanchet@43406	639	servers. This ATP supports a fragment of the TPTP many-typed first-order format
blanchet@43406	640	(TFF). It is supported primarily for experimenting with the
blanchet@43725	641	\textit{type\_sys} $=$ \textit{simple} option (\S\ref{problem-encoding}).
blanchet@43406	642
blanchet@38824	643	\item[$\bullet$] \textbf{\textit{remote\_sine\_e}:} SInE-E is a metaprover
blanchet@38824	644	developed by Kry\v stof Hoder \cite{sine} based on E. The remote version of
blanchet@38824	645	SInE runs on Geoff Sutcliffe's Miami servers.
blanchet@38824	646
blanchet@38824	647	\item[$\bullet$] \textbf{\textit{remote\_snark}:} SNARK is a prover
blanchet@38824	648	developed by Stickel et al.\ \cite{snark}. The remote version of
blanchet@38824	649	SNARK runs on Geoff Sutcliffe's Miami servers.
blanchet@40254	650
blanchet@42609	651	\item[$\bullet$] \textbf{\textit{remote\_cvc3}:} The remote version of CVC3 runs
blanchet@42609	652	on servers at the TU M\"unchen (or wherever \texttt{REMOTE\_SMT\_URL} is set to
blanchet@42609	653	point).
blanchet@42609	654
blanchet@41190	655	\item[$\bullet$] \textbf{\textit{remote\_z3}:} The remote version of Z3 runs on
blanchet@41190	656	servers at the TU M\"unchen (or wherever \texttt{REMOTE\_SMT\_URL} is set to
blanchet@41190	657	point).
blanchet@40254	658
blanchet@42611	659	\item[$\bullet$] \textbf{\textit{remote\_z3\_atp}:} The remote version of ``Z3
blanchet@42611	660	as an ATP'' runs on Geoff Sutcliffe's Miami servers.
blanchet@36918	661	\end{enum}
blanchet@36918	662
blanchet@41190	663	By default, Sledgehammer will run E, SPASS, Vampire, SInE-E, and Z3 (or whatever
blanchet@43089	664	the SMT module's \textit{smt\_solver} configuration option is set to) in
blanchet@40254	665	parallel---either locally or remotely, depending on the number of processor
blanchet@40254	666	cores available. For historical reasons, the default value of this option can be
blanchet@40254	667	overridden using the option ``Sledgehammer: Provers'' from the ``Isabelle'' menu
blanchet@40254	668	in Proof General.
blanchet@36918	669
blanchet@40240	670	It is a good idea to run several provers in parallel, although it could slow
blanchet@40254	671	down your machine. Running E, SPASS, Vampire, and SInE-E together for 5 seconds
blanchet@40254	672	yields a better success rate than running the most effective of these (Vampire)
blanchet@40254	673	for 120 seconds \cite{boehme-nipkow-2010}.
blanchet@40240	674
blanchet@40240	675	\opnodefault{prover}{string}
blanchet@40240	676	Alias for \textit{provers}.
blanchet@40240	677
blanchet@40240	678	\opnodefault{atps}{string}
blanchet@40240	679	Legacy alias for \textit{provers}.
blanchet@36918	680
blanchet@36918	681	\opnodefault{atp}{string}
blanchet@40240	682	Legacy alias for \textit{provers}.
blanchet@36918	683
blanchet@40584	684	\opdefault{timeout}{float\_or\_none}{\upshape 30}
blanchet@40582	685	Specifies the maximum number of seconds that the automatic provers should spend
blanchet@43719	686	searching for a proof. This excludes problem preparation and is a soft limit.
blanchet@43719	687	For historical reasons, the default value of this option can be overridden using
blanchet@43719	688	the option ``Sledgehammer: Time Limit'' from the ``Isabelle'' menu in Proof
blanchet@43719	689	General.
blanchet@39228	690
blanchet@39227	691	\opfalse{blocking}{non\_blocking}
blanchet@39227	692	Specifies whether the \textbf{sledgehammer} command should operate
blanchet@39227	693	synchronously. The asynchronous (non-blocking) mode lets the user start proving
blanchet@39227	694	the putative theorem manually while Sledgehammer looks for a proof, but it can
blanchet@39227	695	also be more confusing.
blanchet@39227	696
blanchet@43314	697	\optrue{slicing}{no\_slicing}
blanchet@43314	698	Specifies whether the time allocated to a prover should be sliced into several
blanchet@43314	699	segments, each of which has its own set of possibly prover-dependent options.
blanchet@43317	700	For SPASS and Vampire, the first slice tries the fast but incomplete
blanchet@43314	701	set-of-support (SOS) strategy, whereas the second slice runs without it. For E,
blanchet@43317	702	up to three slices are tried, with different weighted search strategies and
blanchet@43314	703	numbers of facts. For SMT solvers, several slices are tried with the same options
blanchet@43317	704	each time but fewer and fewer facts. According to benchmarks with a timeout of
blanchet@43317	705	30 seconds, slicing is a valuable optimization, and you should probably leave it
blanchet@43317	706	enabled unless you are conducting experiments. This option is implicitly
blanchet@43314	707	disabled for (short) automatic runs.
blanchet@43314	708
blanchet@43314	709	\nopagebreak
blanchet@43314	710	{\small See also \textit{verbose} (\S\ref{output-format}).}
blanchet@43314	711
blanchet@36918	712	\opfalse{overlord}{no\_overlord}
blanchet@36918	713	Specifies whether Sledgehammer should put its temporary files in
blanchet@36918	714	\texttt{\$ISA\-BELLE\_\allowbreak HOME\_\allowbreak USER}, which is useful for
blanchet@36918	715	debugging Sledgehammer but also unsafe if several instances of the tool are run
blanchet@36918	716	simultaneously. The files are identified by the prefix \texttt{prob\_}; you may
blanchet@36918	717	safely remove them after Sledgehammer has run.
blanchet@36918	718
blanchet@36918	719	\nopagebreak
blanchet@36918	720	{\small See also \textit{debug} (\S\ref{output-format}).}
blanchet@36918	721	\end{enum}
blanchet@36918	722
blanchet@36918	723	\subsection{Problem Encoding}
blanchet@36918	724	\label{problem-encoding}
blanchet@36918	725
blanchet@36918	726	\begin{enum}
blanchet@36918	727	\opfalse{explicit\_apply}{implicit\_apply}
blanchet@36918	728	Specifies whether function application should be encoded as an explicit
blanchet@40254	729	``apply'' operator in ATP problems. If the option is set to \textit{false}, each
blanchet@40254	730	function will be directly applied to as many arguments as possible. Enabling
blanchet@40254	731	this option can sometimes help discover higher-order proofs that otherwise would
blanchet@40254	732	not be found.
blanchet@36918	733
blanchet@36918	734	\opfalse{full\_types}{partial\_types}
blanchet@43551	735	Specifies whether full type information is encoded in ATP problems. Enabling
blanchet@43601	736	this option prevents the discovery of type-incorrect proofs, but it can slow
blanchet@43601	737	down the ATP slightly. This option is implicitly enabled for automatic runs. For
blanchet@43601	738	historical reasons, the default value of this option can be overridden using the
blanchet@43601	739	option ``Sledgehammer: Full Types'' from the ``Isabelle'' menu in Proof General.
blanchet@43089	740
blanchet@43089	741	\opdefault{type\_sys}{string}{smart}
blanchet@43089	742	Specifies the type system to use in ATP problems. The option can take the
blanchet@43089	743	following values:
blanchet@43089	744
blanchet@43089	745	\begin{enum}
blanchet@43587	746	\item[$\bullet$] \textbf{\textit{poly\_preds}:} Types are encoded using a predicate
blanchet@43460	747	$\mathit{has\_type\/}(\tau, t)$ that restricts the range of bound variables.
blanchet@43460	748	Constants are annotated with their types, supplied as extra arguments, to
blanchet@43460	749	resolve overloading.
blanchet@43453	750
blanchet@43587	751	\item[$\bullet$] \textbf{\textit{poly\_tags}:} Each term and subterm is tagged with
blanchet@43555	752	its type using a function $\mathit{type\_info\/}(\tau, t)$.
blanchet@43555	753
blanchet@43587	754	\item[$\bullet$] \textbf{\textit{poly\_args}:}
blanchet@43587	755	As in the sound encodings above, constants are annotated with their types to
blanchet@43587	756	resolve overloading, but otherwise no type information is encoded.
blanchet@43555	757
blanchet@43587	758	\item[$\bullet$] \textbf{\textit{erased}:} No type information is supplied to
blanchet@43587	759	the ATP. Types are simply erased.
blanchet@43453	760
blanchet@43587	761	\item[$\bullet$]
blanchet@43587	762	\textbf{%
blanchet@43587	763	\textit{mono\_preds},
blanchet@43587	764	\textit{mono\_tags},
blanchet@43587	765	\textit{mono\_args}:} \\
blanchet@43587	766	Similar to \textit{poly\_preds}, \textit{poly\_tags}, and \textit{poly\_args},
blanchet@43587	767	respectively, but the problem is additionally monomorphized, meaning that type
blanchet@43587	768	variables are instantiated with heuristically chosen ground types.
blanchet@43587	769	Monomorphization can simplify reasoning but also leads to larger fact bases,
blanchet@43587	770	which can slow down the ATPs.
blanchet@43453	771
blanchet@43725	772	\item[$\bullet$] \textbf{\textit{simple}:} Use the prover's support for simply
blanchet@43725	773	typed first-order logic if available; otherwise, fall back on
blanchet@43587	774	\textit{mangled\_preds}. The problem is monomorphized.
blanchet@43587	775
blanchet@43587	776	\item[$\bullet$]
blanchet@43587	777	\textbf{%
blanchet@43587	778	\textit{mangled\_preds},
blanchet@43587	779	\textit{mangled\_tags},
blanchet@43587	780	\textit{mangled\_args}:} \\
blanchet@43587	781	Similar to
blanchet@43587	782	\textit{mono\_preds}, \textit{mono\_tags}, and \textit{mono\_args},
blanchet@43587	783	respectively, but types are mangled in constant names instead of being supplied
blanchet@43587	784	as ground term arguments. The binary predicate $\mathit{has\_type\/}(\tau, t)$
blanchet@43587	785	becomes a unary predicate $\mathit{has\_type\_}\tau(t)$, and the binary function
blanchet@43460	786	$\mathit{type\_info\/}(\tau, t)$ becomes a unary function
blanchet@43460	787	$\mathit{type\_info\_}\tau(t)$.
blanchet@43453	788
blanchet@43453	789	\item[$\bullet$]
blanchet@43453	790	\textbf{%
blanchet@43725	791	\textit{mono\_preds}?, \textit{mono\_tags}?, \textit{simple}?, \\
blanchet@43618	792	\textit{mangled\_preds}?, \textit{mangled\_tags}?:} \\
blanchet@43725	793	The type systems \textit{mono\_preds}, \textit{mono\_tags}, \textit{simple},
blanchet@43587	794	\textit{mangled\_preds}, and \textit{mangled\_tags} are fully typed and
blanchet@43587	795	virtually sound---except for pathological cases, all found proofs are
blanchet@43608	796	type-correct. For each of these, Sledgehammer also provides a lighter (but
blanchet@43608	797	virtually sound) variant identified by a question mark (`{?}')\ that detects and
blanchet@43725	798	erases monotonic types, notably infinite types. (For \textit{simple}, the types
blanchet@43725	799	are not actually erased but rather replaced by a shared uniform type of
blanchet@43608	800	individuals.)
blanchet@43551	801
blanchet@43551	802	\item[$\bullet$]
blanchet@43551	803	\textbf{%
blanchet@43618	804	\textit{poly\_preds}!, \textit{poly\_tags}!, \textit{mono\_preds}!, \textit{mono\_tags}!, \\
blanchet@43725	805	\textit{simple}!, \textit{mangled\_preds}!, \textit{mangled\_tags}!:} \\
blanchet@43608	806	The type systems \textit{poly\_preds}, \textit{poly\_tags},
blanchet@43725	807	\textit{mono\_preds}, \textit{mono\_tags}, \textit{simple},
blanchet@43608	808	\textit{mangled\_preds}, and \textit{mangled\_tags} also admit a somewhat
blanchet@43608	809	unsound (but very efficient) variant identified by an exclamation mark (`{!}')
blanchet@43608	810	that detects and erases all types except those that are clearly finite
blanchet@43725	811	(e.g., \textit{bool}). (For \textit{simple}, the types are not actually erased
blanchet@43725	812	but rather replaced by a shared uniform type of individuals.)
blanchet@43460	813
blanchet@43098	814	\item[$\bullet$] \textbf{\textit{smart}:} If \textit{full\_types} is enabled,
blanchet@43460	815	uses a fully typed, virtually sound encoding; otherwise, uses any encoding. The
blanchet@43460	816	actual encoding used depends on the ATP and should be the most efficient for
blanchet@43460	817	that ATP.
blanchet@43089	818	\end{enum}
blanchet@43089	819
blanchet@43725	820	In addition, all the \textit{preds} and \textit{tags} type systems are available
blanchet@43725	821	in two variants, a lightweight and a heavyweight variant. The lightweight
blanchet@43725	822	variants are generally more efficient and are the default; the heavyweight
blanchet@43725	823	variants are identified by a \textit{\_heavy} suffix (e.g.,
blanchet@43725	824	\textit{mangled\_preds\_heavy}{?}).
blanchet@43394	825
blanchet@43725	826	For SMT solvers and ToFoF-E, the type system is always \textit{simple},
blanchet@43725	827	irrespective of the value of this option.
blanchet@43725	828
blanchet@43725	829	\opdefault{max\_mono\_iters}{int}{\upshape 3}
blanchet@43394	830	Specifies the maximum number of iterations for the monomorphization fixpoint
blanchet@43394	831	construction. The higher this limit is, the more monomorphic instances are
blanchet@43462	832	potentially generated. Whether monomorphization takes place depends on the
blanchet@43462	833	type system used.
blanchet@43589	834
blanchet@43725	835	\opdefault{max\_new\_mono\_instances}{int}{\upshape 400}
blanchet@43608	836	Specifies the maximum number of monomorphic instances to generate beyond
blanchet@43608	837	\textit{max\_relevant}. The higher this limit is, the more monomorphic instances
blanchet@43608	838	are potentially generated. Whether monomorphization takes place depends on the
blanchet@43608	839	type system used.
blanchet@38814	840	\end{enum}
blanchet@36918	841
blanchet@38814	842	\subsection{Relevance Filter}
blanchet@38814	843	\label{relevance-filter}
blanchet@38814	844
blanchet@38814	845	\begin{enum}
blanchet@40584	846	\opdefault{relevance\_thresholds}{float\_pair}{\upshape 0.45~0.85}
blanchet@38985	847	Specifies the thresholds above which facts are considered relevant by the
blanchet@38985	848	relevance filter. The first threshold is used for the first iteration of the
blanchet@38985	849	relevance filter and the second threshold is used for the last iteration (if it
blanchet@38985	850	is reached). The effective threshold is quadratically interpolated for the other
blanchet@40584	851	iterations. Each threshold ranges from 0 to 1, where 0 means that all theorems
blanchet@40584	852	are relevant and 1 means that only theorems that refer to previously seen constants are relevant.
blanchet@36918	853
blanchet@40584	854	\opsmart{max\_relevant}{int\_or\_smart}
blanchet@38985	855	Specifies the maximum number of facts that may be returned by the relevance
blanchet@38985	856	filter. If the option is set to \textit{smart}, it is set to a value that was
blanchet@40240	857	empirically found to be appropriate for the prover. A typical value would be
blanchet@40240	858	300.
blanchet@43051	859
blanchet@36918	860	\end{enum}
blanchet@36918	861
blanchet@36918	862	\subsection{Output Format}
blanchet@36918	863	\label{output-format}
blanchet@36918	864
blanchet@36918	865	\begin{enum}
blanchet@36918	866
blanchet@36918	867	\opfalse{verbose}{quiet}
blanchet@36918	868	Specifies whether the \textbf{sledgehammer} command should explain what it does.
blanchet@41456	869	This option is implicitly disabled for automatic runs.
blanchet@36918	870
blanchet@36918	871	\opfalse{debug}{no\_debug}
blanchet@40444	872	Specifies whether Sledgehammer should display additional debugging information
blanchet@40444	873	beyond what \textit{verbose} already displays. Enabling \textit{debug} also
blanchet@41456	874	enables \textit{verbose} and \textit{blocking} (\S\ref{mode-of-operation})
blanchet@41456	875	behind the scenes. The \textit{debug} option is implicitly disabled for
blanchet@41456	876	automatic runs.
blanchet@36918	877
blanchet@36918	878	\nopagebreak
blanchet@36918	879	{\small See also \textit{overlord} (\S\ref{mode-of-operation}).}
blanchet@36918	880
blanchet@36918	881	\opfalse{isar\_proof}{no\_isar\_proof}
blanchet@36918	882	Specifies whether Isar proofs should be output in addition to one-liner
blanchet@36918	883	\textit{metis} proofs. Isar proof construction is still experimental and often
blanchet@36918	884	fails; however, Isar proofs are usually faster and sometimes more robust than
blanchet@36918	885	\textit{metis} proofs.
blanchet@36918	886
blanchet@40584	887	\opdefault{isar\_shrink\_factor}{int}{\upshape 1}
blanchet@36918	888	Specifies the granularity of the Isar proof. A value of $n$ indicates that each
blanchet@36918	889	Isar proof step should correspond to a group of up to $n$ consecutive proof
blanchet@36918	890	steps in the ATP proof.
blanchet@36918	891
blanchet@36918	892	\end{enum}
blanchet@36918	893
blanchet@39228	894	\subsection{Authentication}
blanchet@39228	895	\label{authentication}
blanchet@36918	896
blanchet@36918	897	\begin{enum}
blanchet@39228	898	\opnodefault{expect}{string}
blanchet@39228	899	Specifies the expected outcome, which must be one of the following:
blanchet@39228	900
blanchet@39228	901	\begin{enum}
blanchet@40444	902	\item[$\bullet$] \textbf{\textit{some}:} Sledgehammer found a (potentially
blanchet@40444	903	unsound) proof.
blanchet@39228	904	\item[$\bullet$] \textbf{\textit{none}:} Sledgehammer found no proof.
blanchet@40444	905	\item[$\bullet$] \textbf{\textit{unknown}:} Sledgehammer encountered some
blanchet@40444	906	problem.
blanchet@39228	907	\end{enum}
blanchet@39228	908
blanchet@39228	909	Sledgehammer emits an error (if \textit{blocking} is enabled) or a warning
blanchet@39228	910	(otherwise) if the actual outcome differs from the expected outcome. This option
blanchet@39228	911	is useful for regression testing.
blanchet@39228	912
blanchet@39228	913	\nopagebreak
blanchet@39228	914	{\small See also \textit{blocking} (\S\ref{mode-of-operation}).}
blanchet@36918	915	\end{enum}
blanchet@36918	916
blanchet@36918	917	\let\em=\sl
blanchet@36918	918	\bibliography{../manual}{}
blanchet@36918	919	\bibliographystyle{abbrv}
blanchet@36918	920
blanchet@36918	921	\end{document}

author	blanchet
	Fri, 20 May 2011 12:47:58 +0200
changeset 43746	d7447b8c4265
parent 43725	9eef1dc200a8
child 43752	ec1ea24d49bc
permissions	-rw-r--r--