wneuper/isa: doc-src/Nitpick/nitpick.tex@7b8c366e34a2 (annotated)

blanchet@33191	1	\documentclass[a4paper,12pt]{article}
blanchet@33191	2	\usepackage[T1]{fontenc}
blanchet@33191	3	\usepackage{amsmath}
blanchet@33191	4	\usepackage{amssymb}
blanchet@33555	5	\usepackage[english,french]{babel}
blanchet@33191	6	\usepackage{color}
blanchet@33191	7	\usepackage{graphicx}
blanchet@33191	8	%\usepackage{mathpazo}
blanchet@33191	9	\usepackage{multicol}
blanchet@33191	10	\usepackage{stmaryrd}
blanchet@33191	11	%\usepackage[scaled=.85]{beramono}
blanchet@33191	12	\usepackage{../iman,../pdfsetup}
blanchet@33191	13
blanchet@33191	14	%\oddsidemargin=4.6mm
blanchet@33191	15	%\evensidemargin=4.6mm
blanchet@33191	16	%\textwidth=150mm
blanchet@33191	17	%\topmargin=4.6mm
blanchet@33191	18	%\headheight=0mm
blanchet@33191	19	%\headsep=0mm
blanchet@33191	20	%\textheight=234mm
blanchet@33191	21
blanchet@33191	22	\def\Colon{\mathord{:\mkern-1.5mu:}}
blanchet@33191	23	%\def\lbrakk{\mathopen{\lbrack\mkern-3.25mu\lbrack}}
blanchet@33191	24	%\def\rbrakk{\mathclose{\rbrack\mkern-3.255mu\rbrack}}
blanchet@33191	25	\def\lparr{\mathopen{(\mkern-4mu\mid}}
blanchet@33191	26	\def\rparr{\mathclose{\mid\mkern-4mu)}}
blanchet@33191	27
blanchet@33191	28	\def\unk{{?}}
blanchet@34969	29	\def\undef{(\lambda x.\; \unk)}
blanchet@33191	30	%\def\unr{\textit{others}}
blanchet@33191	31	\def\unr{\ldots}
blanchet@33191	32	\def\Abs#1{\hbox{\rm{\flqq}}{\,#1\,}\hbox{\rm{\frqq}}}
blanchet@33191	33	\def\Q{{\smash{\lower.2ex\hbox{$\scriptstyle?$}}}}
blanchet@33191	34
blanchet@33191	35	\hyphenation{Mini-Sat size-change First-Steps grand-parent nit-pick
blanchet@33191	36	counter-example counter-examples data-type data-types co-data-type
blanchet@33191	37	co-data-types in-duc-tive co-in-duc-tive}
blanchet@33191	38
blanchet@33191	39	\urlstyle{tt}
blanchet@33191	40
blanchet@33191	41	\begin{document}
blanchet@33191	42
blanchet@33555	43	\selectlanguage{english}
blanchet@33555	44
blanchet@33191	45	\title{\includegraphics[scale=0.5]{isabelle_nitpick} \\[4ex]
blanchet@33191	46	Picking Nits \\[\smallskipamount]
blanchet@33887	47	\Large A User's Guide to Nitpick for Isabelle/HOL}
blanchet@33191	48	\author{\hbox{} \\
blanchet@33191	49	Jasmin Christian Blanchette \\
blanchet@33887	50	{\normalsize Institut f\"ur Informatik, Technische Universit\"at M\"unchen} \\
blanchet@33191	51	\hbox{}}
blanchet@33191	52
blanchet@33191	53	\maketitle
blanchet@33191	54
blanchet@33191	55	\tableofcontents
blanchet@33191	56
blanchet@33191	57	\setlength{\parskip}{.7em plus .2em minus .1em}
blanchet@33191	58	\setlength{\parindent}{0pt}
blanchet@33191	59	\setlength{\abovedisplayskip}{\parskip}
blanchet@33191	60	\setlength{\abovedisplayshortskip}{.9\parskip}
blanchet@33191	61	\setlength{\belowdisplayskip}{\parskip}
blanchet@33191	62	\setlength{\belowdisplayshortskip}{.9\parskip}
blanchet@33191	63
blanchet@33191	64	% General-purpose enum environment with correct spacing
blanchet@33191	65	\newenvironment{enum}%
blanchet@33191	66	{\begin{list}{}{%
blanchet@33191	67	\setlength{\topsep}{.1\parskip}%
blanchet@33191	68	\setlength{\partopsep}{.1\parskip}%
blanchet@33191	69	\setlength{\itemsep}{\parskip}%
blanchet@33191	70	\advance\itemsep by-\parsep}}
blanchet@33191	71	{\end{list}}
blanchet@33191	72
blanchet@33191	73	\def\pre{\begingroup\vskip0pt plus1ex\advance\leftskip by\leftmargin
blanchet@33191	74	\advance\rightskip by\leftmargin}
blanchet@33191	75	\def\post{\vskip0pt plus1ex\endgroup}
blanchet@33191	76
blanchet@33191	77	\def\prew{\pre\advance\rightskip by-\leftmargin}
blanchet@33191	78	\def\postw{\post}
blanchet@33191	79
blanchet@33191	80	\section{Introduction}
blanchet@33191	81	\label{introduction}
blanchet@33191	82
blanchet@33191	83	Nitpick \cite{blanchette-nipkow-2009} is a counterexample generator for
blanchet@33191	84	Isabelle/HOL \cite{isa-tutorial} that is designed to handle formulas
blanchet@33191	85	combining (co)in\-duc\-tive datatypes, (co)in\-duc\-tively defined predicates, and
blanchet@33191	86	quantifiers. It builds on Kodkod \cite{torlak-jackson-2007}, a highly optimized
blanchet@33191	87	first-order relational model finder developed by the Software Design Group at
blanchet@33191	88	MIT. It is conceptually similar to Refute \cite{weber-2008}, from which it
blanchet@33191	89	borrows many ideas and code fragments, but it benefits from Kodkod's
blanchet@33191	90	optimizations and a new encoding scheme. The name Nitpick is shamelessly
blanchet@33191	91	appropriated from a now retired Alloy precursor.
blanchet@33191	92
blanchet@33191	93	Nitpick is easy to use---you simply enter \textbf{nitpick} after a putative
blanchet@33191	94	theorem and wait a few seconds. Nonetheless, there are situations where knowing
blanchet@33191	95	how it works under the hood and how it reacts to various options helps
blanchet@33191	96	increase the test coverage. This manual also explains how to install the tool on
blanchet@33191	97	your workstation. Should the motivation fail you, think of the many hours of
blanchet@33191	98	hard work Nitpick will save you. Proving non-theorems is \textsl{hard work}.
blanchet@33191	99
blanchet@33191	100	Another common use of Nitpick is to find out whether the axioms of a locale are
blanchet@33191	101	satisfiable, while the locale is being developed. To check this, it suffices to
blanchet@33191	102	write
blanchet@33191	103
blanchet@33191	104	\prew
blanchet@33191	105	\textbf{lemma}~``$\textit{False}$'' \\
blanchet@33191	106	\textbf{nitpick}~[\textit{show\_all}]
blanchet@33191	107	\postw
blanchet@33191	108
blanchet@33191	109	after the locale's \textbf{begin} keyword. To falsify \textit{False}, Nitpick
blanchet@33191	110	must find a model for the axioms. If it finds no model, we have an indication
blanchet@33191	111	that the axioms might be unsatisfiable.
blanchet@33191	112
blanchet@33195	113	Nitpick requires the Kodkodi package for Isabelle as well as a Java 1.5 virtual
blanchet@33195	114	machine called \texttt{java}. The examples presented in this manual can be found
blanchet@33195	115	in Isabelle's \texttt{src/HOL/Nitpick\_Examples/Manual\_Nits.thy} theory.
blanchet@33195	116
blanchet@33552	117	Throughout this manual, we will explicitly invoke the \textbf{nitpick} command.
blanchet@33552	118	Nitpick also provides an automatic mode that can be enabled using the
blanchet@33552	119	``Auto Nitpick'' option from the ``Isabelle'' menu in Proof General. In this
blanchet@33552	120	mode, Nitpick is run on every newly entered theorem, much like Auto Quickcheck.
blanchet@33552	121	The collective time limit for Auto Nitpick and Auto Quickcheck can be set using
blanchet@33552	122	the ``Auto Counterexample Time Limit'' option.
blanchet@33552	123
blanchet@33191	124	\newbox\boxA
blanchet@33191	125	\setbox\boxA=\hbox{\texttt{nospam}}
blanchet@33191	126
blanchet@33191	127	The known bugs and limitations at the time of writing are listed in
blanchet@33191	128	\S\ref{known-bugs-and-limitations}. Comments and bug reports concerning Nitpick
blanchet@33191	129	or this manual should be directed to
blanchet@33191	130	\texttt{blan{\color{white}nospam}\kern-\wd\boxA{}chette@\allowbreak
blanchet@33191	131	in.\allowbreak tum.\allowbreak de}.
blanchet@33191	132
blanchet@33191	133	\vskip2.5\smallskipamount
blanchet@33191	134
blanchet@33191	135	\textbf{Acknowledgment.} The author would like to thank Mark Summerfield for
blanchet@33191	136	suggesting several textual improvements.
blanchet@33191	137	% and Perry James for reporting a typo.
blanchet@33191	138
blanchet@33191	139	\section{First Steps}
blanchet@33191	140	\label{first-steps}
blanchet@33191	141
blanchet@33191	142	This section introduces Nitpick by presenting small examples. If possible, you
blanchet@33191	143	should try out the examples on your workstation. Your theory file should start
blanchet@33191	144	the standard way:
blanchet@33191	145
blanchet@33191	146	\prew
blanchet@33191	147	\textbf{theory}~\textit{Scratch} \\
blanchet@33191	148	\textbf{imports}~\textit{Main} \\
blanchet@33191	149	\textbf{begin}
blanchet@33191	150	\postw
blanchet@33191	151
blanchet@33191	152	The results presented here were obtained using the JNI version of MiniSat and
blanchet@33191	153	with multithreading disabled to reduce nondeterminism. This was done by adding
blanchet@33191	154	the line
blanchet@33191	155
blanchet@33191	156	\prew
blanchet@33191	157	\textbf{nitpick\_params} [\textit{sat\_solver}~= \textit{MiniSatJNI}, \,\textit{max\_threads}~= 1]
blanchet@33191	158	\postw
blanchet@33191	159
blanchet@33191	160	after the \textbf{begin} keyword. The JNI version of MiniSat is bundled with
blanchet@33191	161	Kodkodi and is precompiled for the major platforms. Other SAT solvers can also
blanchet@33191	162	be installed, as explained in \S\ref{optimizations}. If you have already
blanchet@33191	163	configured SAT solvers in Isabelle (e.g., for Refute), these will also be
blanchet@33191	164	available to Nitpick.
blanchet@33191	165
blanchet@33191	166	\subsection{Propositional Logic}
blanchet@33191	167	\label{propositional-logic}
blanchet@33191	168
blanchet@33191	169	Let's start with a trivial example from propositional logic:
blanchet@33191	170
blanchet@33191	171	\prew
blanchet@33191	172	\textbf{lemma}~``$P \longleftrightarrow Q$'' \\
blanchet@33191	173	\textbf{nitpick}
blanchet@33191	174	\postw
blanchet@33191	175
blanchet@33191	176	You should get the following output:
blanchet@33191	177
blanchet@33191	178	\prew
blanchet@33191	179	\slshape
blanchet@33191	180	Nitpick found a counterexample: \\[2\smallskipamount]
blanchet@33191	181	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	182	\hbox{}\qquad\qquad $P = \textit{True}$ \\
blanchet@33191	183	\hbox{}\qquad\qquad $Q = \textit{False}$
blanchet@33191	184	\postw
blanchet@33191	185
blanchet@33191	186	Nitpick can also be invoked on individual subgoals, as in the example below:
blanchet@33191	187
blanchet@33191	188	\prew
blanchet@33191	189	\textbf{apply}~\textit{auto} \\[2\smallskipamount]
blanchet@33191	190	{\slshape goal (2 subgoals): \\
blanchet@34969	191	\phantom{0}1. $P\,\Longrightarrow\, Q$ \\
blanchet@34969	192	\phantom{0}2. $Q\,\Longrightarrow\, P$} \\[2\smallskipamount]
blanchet@33191	193	\textbf{nitpick}~1 \\[2\smallskipamount]
blanchet@33191	194	{\slshape Nitpick found a counterexample: \\[2\smallskipamount]
blanchet@33191	195	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	196	\hbox{}\qquad\qquad $P = \textit{True}$ \\
blanchet@33191	197	\hbox{}\qquad\qquad $Q = \textit{False}$} \\[2\smallskipamount]
blanchet@33191	198	\textbf{nitpick}~2 \\[2\smallskipamount]
blanchet@33191	199	{\slshape Nitpick found a counterexample: \\[2\smallskipamount]
blanchet@33191	200	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	201	\hbox{}\qquad\qquad $P = \textit{False}$ \\
blanchet@33191	202	\hbox{}\qquad\qquad $Q = \textit{True}$} \\[2\smallskipamount]
blanchet@33191	203	\textbf{oops}
blanchet@33191	204	\postw
blanchet@33191	205
blanchet@33191	206	\subsection{Type Variables}
blanchet@33191	207	\label{type-variables}
blanchet@33191	208
blanchet@33191	209	If you are left unimpressed by the previous example, don't worry. The next
blanchet@33191	210	one is more mind- and computer-boggling:
blanchet@33191	211
blanchet@33191	212	\prew
blanchet@33191	213	\textbf{lemma} ``$P~x\,\Longrightarrow\, P~(\textrm{THE}~y.\;P~y)$''
blanchet@33191	214	\postw
blanchet@33191	215	\pagebreak[2] %% TYPESETTING
blanchet@33191	216
blanchet@33191	217	The putative lemma involves the definite description operator, {THE}, presented
blanchet@33191	218	in section 5.10.1 of the Isabelle tutorial \cite{isa-tutorial}. The
blanchet@33191	219	operator is defined by the axiom $(\textrm{THE}~x.\; x = a) = a$. The putative
blanchet@33191	220	lemma is merely asserting the indefinite description operator axiom with {THE}
blanchet@33191	221	substituted for {SOME}.
blanchet@33191	222
blanchet@33191	223	The free variable $x$ and the bound variable $y$ have type $'a$. For formulas
blanchet@33191	224	containing type variables, Nitpick enumerates the possible domains for each type
blanchet@33191	225	variable, up to a given cardinality (8 by default), looking for a finite
blanchet@33191	226	countermodel:
blanchet@33191	227
blanchet@33191	228	\prew
blanchet@33191	229	\textbf{nitpick} [\textit{verbose}] \\[2\smallskipamount]
blanchet@33191	230	\slshape
blanchet@33191	231	Trying 8 scopes: \nopagebreak \\
blanchet@33191	232	\hbox{}\qquad \textit{card}~$'a$~= 1; \\
blanchet@33191	233	\hbox{}\qquad \textit{card}~$'a$~= 2; \\
blanchet@33191	234	\hbox{}\qquad $\qquad\vdots$ \\[.5\smallskipamount]
blanchet@33191	235	\hbox{}\qquad \textit{card}~$'a$~= 8. \\[2\smallskipamount]
blanchet@33191	236	Nitpick found a counterexample for \textit{card} $'a$~= 3: \\[2\smallskipamount]
blanchet@33191	237	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	238	\hbox{}\qquad\qquad $P = \{a_2,\, a_3\}$ \\
blanchet@33191	239	\hbox{}\qquad\qquad $x = a_3$ \\[2\smallskipamount]
blanchet@33191	240	Total time: 580 ms.
blanchet@33191	241	\postw
blanchet@33191	242
blanchet@33191	243	Nitpick found a counterexample in which $'a$ has cardinality 3. (For
blanchet@33191	244	cardinalities 1 and 2, the formula holds.) In the counterexample, the three
blanchet@33191	245	values of type $'a$ are written $a_1$, $a_2$, and $a_3$.
blanchet@33191	246
blanchet@33191	247	The message ``Trying $n$ scopes: {\ldots}''\ is shown only if the option
blanchet@33191	248	\textit{verbose} is enabled. You can specify \textit{verbose} each time you
blanchet@33191	249	invoke \textbf{nitpick}, or you can set it globally using the command
blanchet@33191	250
blanchet@33191	251	\prew
blanchet@33191	252	\textbf{nitpick\_params} [\textit{verbose}]
blanchet@33191	253	\postw
blanchet@33191	254
blanchet@33191	255	This command also displays the current default values for all of the options
blanchet@33191	256	supported by Nitpick. The options are listed in \S\ref{option-reference}.
blanchet@33191	257
blanchet@33191	258	\subsection{Constants}
blanchet@33191	259	\label{constants}
blanchet@33191	260
blanchet@33191	261	By just looking at Nitpick's output, it might not be clear why the
blanchet@33191	262	counterexample in \S\ref{type-variables} is genuine. Let's invoke Nitpick again,
blanchet@33191	263	this time telling it to show the values of the constants that occur in the
blanchet@33191	264	formula:
blanchet@33191	265
blanchet@33191	266	\prew
blanchet@33191	267	\textbf{lemma}~``$P~x\,\Longrightarrow\, P~(\textrm{THE}~y.\;P~y)$'' \\
blanchet@33191	268	\textbf{nitpick}~[\textit{show\_consts}] \\[2\smallskipamount]
blanchet@33191	269	\slshape
blanchet@33191	270	Nitpick found a counterexample for \textit{card} $'a$~= 3: \\[2\smallskipamount]
blanchet@33191	271	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	272	\hbox{}\qquad\qquad $P = \{a_2,\, a_3\}$ \\
blanchet@33191	273	\hbox{}\qquad\qquad $x = a_3$ \\
blanchet@33191	274	\hbox{}\qquad Constant: \nopagebreak \\
blanchet@33191	275	\hbox{}\qquad\qquad $\textit{The}~\textsl{fallback} = a_1$
blanchet@33191	276	\postw
blanchet@33191	277
blanchet@33191	278	We can see more clearly now. Since the predicate $P$ isn't true for a unique
blanchet@33191	279	value, $\textrm{THE}~y.\;P~y$ can denote any value of type $'a$, even
blanchet@33191	280	$a_1$. Since $P~a_1$ is false, the entire formula is falsified.
blanchet@33191	281
blanchet@33191	282	As an optimization, Nitpick's preprocessor introduced the special constant
blanchet@33191	283	``\textit{The} fallback'' corresponding to $\textrm{THE}~y.\;P~y$ (i.e.,
blanchet@33191	284	$\mathit{The}~(\lambda y.\;P~y)$) when there doesn't exist a unique $y$
blanchet@33191	285	satisfying $P~y$. We disable this optimization by passing the
blanchet@33191	286	\textit{full\_descrs} option:
blanchet@33191	287
blanchet@33191	288	\prew
blanchet@33191	289	\textbf{nitpick}~[\textit{full\_descrs},\, \textit{show\_consts}] \\[2\smallskipamount]
blanchet@33191	290	\slshape
blanchet@33191	291	Nitpick found a counterexample for \textit{card} $'a$~= 3: \\[2\smallskipamount]
blanchet@33191	292	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	293	\hbox{}\qquad\qquad $P = \{a_2,\, a_3\}$ \\
blanchet@33191	294	\hbox{}\qquad\qquad $x = a_3$ \\
blanchet@33191	295	\hbox{}\qquad Constant: \nopagebreak \\
blanchet@33191	296	\hbox{}\qquad\qquad $\hbox{\slshape THE}~y.\;P~y = a_1$
blanchet@33191	297	\postw
blanchet@33191	298
blanchet@33191	299	As the result of another optimization, Nitpick directly assigned a value to the
blanchet@33191	300	subterm $\textrm{THE}~y.\;P~y$, rather than to the \textit{The} constant. If we
blanchet@33191	301	disable this second optimization by using the command
blanchet@33191	302
blanchet@33191	303	\prew
blanchet@33191	304	\textbf{nitpick}~[\textit{dont\_specialize},\, \textit{full\_descrs},\,
blanchet@33191	305	\textit{show\_consts}]
blanchet@33191	306	\postw
blanchet@33191	307
blanchet@33191	308	we finally get \textit{The}:
blanchet@33191	309
blanchet@33191	310	\prew
blanchet@33191	311	\slshape Constant: \nopagebreak \\
blanchet@33191	312	\hbox{}\qquad $\mathit{The} = \undef{}
blanchet@33191	313	(\!\begin{aligned}[t]%
blanchet@33191	314	& \{\} := a_3,\> \{a_3\} := a_3,\> \{a_2\} := a_2, \\[-2pt] %% TYPESETTING
blanchet@33191	315	& \{a_2, a_3\} := a_1,\> \{a_1\} := a_1,\> \{a_1, a_3\} := a_3, \\[-2pt]
blanchet@33191	316	& \{a_1, a_2\} := a_3,\> \{a_1, a_2, a_3\} := a_3)\end{aligned}$
blanchet@33191	317	\postw
blanchet@33191	318
blanchet@33191	319	Notice that $\textit{The}~(\lambda y.\;P~y) = \textit{The}~\{a_2, a_3\} = a_1$,
blanchet@34969	320	just like before.\footnote{The Isabelle/HOL notation $f(x :=
blanchet@34969	321	y)$ denotes the function that maps $x$ to $y$ and that otherwise behaves like
blanchet@34969	322	$f$.}
blanchet@33191	323
blanchet@33191	324	Our misadventures with THE suggest adding `$\exists!x{.}$' (``there exists a
blanchet@33191	325	unique $x$ such that'') at the front of our putative lemma's assumption:
blanchet@33191	326
blanchet@33191	327	\prew
blanchet@33191	328	\textbf{lemma}~``$\exists {!}x.\; P~x\,\Longrightarrow\, P~(\textrm{THE}~y.\;P~y)$''
blanchet@33191	329	\postw
blanchet@33191	330
blanchet@33191	331	The fix appears to work:
blanchet@33191	332
blanchet@33191	333	\prew
blanchet@33191	334	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	335	\slshape Nitpick found no counterexample.
blanchet@33191	336	\postw
blanchet@33191	337
blanchet@33191	338	We can further increase our confidence in the formula by exhausting all
blanchet@33191	339	cardinalities up to 50:
blanchet@33191	340
blanchet@33191	341	\prew
blanchet@33191	342	\textbf{nitpick} [\textit{card} $'a$~= 1--50]\footnote{The symbol `--'
blanchet@33191	343	can be entered as \texttt{-} (hyphen) or
blanchet@33191	344	\texttt{\char`\\\char`\<midarrow\char`\>}.} \\[2\smallskipamount]
blanchet@33191	345	\slshape Nitpick found no counterexample.
blanchet@33191	346	\postw
blanchet@33191	347
blanchet@33191	348	Let's see if Sledgehammer \cite{sledgehammer-2009} can find a proof:
blanchet@33191	349
blanchet@33191	350	\prew
blanchet@33191	351	\textbf{sledgehammer} \\[2\smallskipamount]
blanchet@33191	352	{\slshape Sledgehammer: external prover ``$e$'' for subgoal 1: \\
blanchet@33191	353	$\exists{!}x.\; P~x\,\Longrightarrow\, P~(\hbox{\slshape THE}~y.\; P~y)$ \\
blanchet@33191	354	Try this command: \textrm{apply}~(\textit{metis~the\_equality})} \\[2\smallskipamount]
blanchet@33191	355	\textbf{apply}~(\textit{metis~the\_equality\/}) \nopagebreak \\[2\smallskipamount]
blanchet@33191	356	{\slshape No subgoals!}% \\[2\smallskipamount]
blanchet@33191	357	%\textbf{done}
blanchet@33191	358	\postw
blanchet@33191	359
blanchet@33191	360	This must be our lucky day.
blanchet@33191	361
blanchet@33191	362	\subsection{Skolemization}
blanchet@33191	363	\label{skolemization}
blanchet@33191	364
blanchet@33191	365	Are all invertible functions onto? Let's find out:
blanchet@33191	366
blanchet@33191	367	\prew
blanchet@33191	368	\textbf{lemma} ``$\exists g.\; \forall x.~g~(f~x) = x
blanchet@33191	369	\,\Longrightarrow\, \forall y.\; \exists x.~y = f~x$'' \\
blanchet@33191	370	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	371	\slshape
blanchet@33191	372	Nitpick found a counterexample for \textit{card} $'a$~= 2 and \textit{card} $'b$~=~1: \\[2\smallskipamount]
blanchet@33191	373	\hbox{}\qquad Free variable: \nopagebreak \\
blanchet@33191	374	\hbox{}\qquad\qquad $f = \undef{}(b_1 := a_1)$ \\
blanchet@33191	375	\hbox{}\qquad Skolem constants: \nopagebreak \\
blanchet@33191	376	\hbox{}\qquad\qquad $g = \undef{}(a_1 := b_1,\> a_2 := b_1)$ \\
blanchet@33191	377	\hbox{}\qquad\qquad $y = a_2$
blanchet@33191	378	\postw
blanchet@33191	379
blanchet@33191	380	Although $f$ is the only free variable occurring in the formula, Nitpick also
blanchet@33191	381	displays values for the bound variables $g$ and $y$. These values are available
blanchet@33191	382	to Nitpick because it performs skolemization as a preprocessing step.
blanchet@33191	383
blanchet@33191	384	In the previous example, skolemization only affected the outermost quantifiers.
blanchet@33191	385	This is not always the case, as illustrated below:
blanchet@33191	386
blanchet@33191	387	\prew
blanchet@33191	388	\textbf{lemma} ``$\exists x.\; \forall f.\; f~x = x$'' \\
blanchet@33191	389	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	390	\slshape
blanchet@33191	391	Nitpick found a counterexample for \textit{card} $'a$~= 2: \\[2\smallskipamount]
blanchet@33191	392	\hbox{}\qquad Skolem constant: \nopagebreak \\
blanchet@33191	393	\hbox{}\qquad\qquad $\lambda x.\; f =
blanchet@33191	394	\undef{}(\!\begin{aligned}[t]
blanchet@33191	395	& a_1 := \undef{}(a_1 := a_2,\> a_2 := a_1), \\[-2pt]
blanchet@33191	396	& a_2 := \undef{}(a_1 := a_1,\> a_2 := a_1))\end{aligned}$
blanchet@33191	397	\postw
blanchet@33191	398
blanchet@33191	399	The variable $f$ is bound within the scope of $x$; therefore, $f$ depends on
blanchet@33191	400	$x$, as suggested by the notation $\lambda x.\,f$. If $x = a_1$, then $f$ is the
blanchet@33191	401	function that maps $a_1$ to $a_2$ and vice versa; otherwise, $x = a_2$ and $f$
blanchet@33191	402	maps both $a_1$ and $a_2$ to $a_1$. In both cases, $f~x \not= x$.
blanchet@33191	403
blanchet@33191	404	The source of the Skolem constants is sometimes more obscure:
blanchet@33191	405
blanchet@33191	406	\prew
blanchet@33191	407	\textbf{lemma} ``$\mathit{refl}~r\,\Longrightarrow\, \mathit{sym}~r$'' \\
blanchet@33191	408	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	409	\slshape
blanchet@33191	410	Nitpick found a counterexample for \textit{card} $'a$~= 2: \\[2\smallskipamount]
blanchet@33191	411	\hbox{}\qquad Free variable: \nopagebreak \\
blanchet@33191	412	\hbox{}\qquad\qquad $r = \{(a_1, a_1),\, (a_2, a_1),\, (a_2, a_2)\}$ \\
blanchet@33191	413	\hbox{}\qquad Skolem constants: \nopagebreak \\
blanchet@33191	414	\hbox{}\qquad\qquad $\mathit{sym}.x = a_2$ \\
blanchet@33191	415	\hbox{}\qquad\qquad $\mathit{sym}.y = a_1$
blanchet@33191	416	\postw
blanchet@33191	417
blanchet@33191	418	What happened here is that Nitpick expanded the \textit{sym} constant to its
blanchet@33191	419	definition:
blanchet@33191	420
blanchet@33191	421	\prew
blanchet@33191	422	$\mathit{sym}~r \,\equiv\,
blanchet@33191	423	\forall x\> y.\,\> (x, y) \in r \longrightarrow (y, x) \in r.$
blanchet@33191	424	\postw
blanchet@33191	425
blanchet@33191	426	As their names suggest, the Skolem constants $\mathit{sym}.x$ and
blanchet@33191	427	$\mathit{sym}.y$ are simply the bound variables $x$ and $y$
blanchet@33191	428	from \textit{sym}'s definition.
blanchet@33191	429
blanchet@33191	430	Although skolemization is a useful optimization, you can disable it by invoking
blanchet@33191	431	Nitpick with \textit{dont\_skolemize}. See \S\ref{optimizations} for details.
blanchet@33191	432
blanchet@33191	433	\subsection{Natural Numbers and Integers}
blanchet@33191	434	\label{natural-numbers-and-integers}
blanchet@33191	435
blanchet@33191	436	Because of the axiom of infinity, the type \textit{nat} does not admit any
blanchet@34121	437	finite models. To deal with this, Nitpick's approach is to consider finite
blanchet@34121	438	subsets $N$ of \textit{nat} and map all numbers $\notin N$ to the undefined
blanchet@34121	439	value (displayed as `$\unk$'). The type \textit{int} is handled similarly.
blanchet@34121	440	Internally, undefined values lead to a three-valued logic.
blanchet@33191	441
blanchet@33191	442	Here is an example involving \textit{int}:
blanchet@33191	443
blanchet@33191	444	\prew
blanchet@33191	445	\textbf{lemma} ``$\lbrakk i \le j;\> n \le (m{\Colon}\mathit{int})\rbrakk \,\Longrightarrow\, i * n + j * m \le i * m + j * n$'' \\
blanchet@33191	446	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	447	\slshape Nitpick found a counterexample: \\[2\smallskipamount]
blanchet@33191	448	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	449	\hbox{}\qquad\qquad $i = 0$ \\
blanchet@33191	450	\hbox{}\qquad\qquad $j = 1$ \\
blanchet@33191	451	\hbox{}\qquad\qquad $m = 1$ \\
blanchet@33191	452	\hbox{}\qquad\qquad $n = 0$
blanchet@33191	453	\postw
blanchet@33191	454
blanchet@34121	455	Internally, Nitpick uses either a unary or a binary representation of numbers.
blanchet@34121	456	The unary representation is more efficient but only suitable for numbers very
blanchet@34121	457	close to zero. By default, Nitpick attempts to choose the more appropriate
blanchet@34121	458	encoding by inspecting the formula at hand. This behavior can be overridden by
blanchet@34121	459	passing either \textit{unary\_ints} or \textit{binary\_ints} as an option. For
blanchet@34121	460	binary notation, the number of bits to use can be specified using
blanchet@34121	461	the \textit{bits} option. For example:
blanchet@34121	462
blanchet@34121	463	\prew
blanchet@34121	464	\textbf{nitpick} [\textit{binary\_ints}, \textit{bits}${} = 16$]
blanchet@34121	465	\postw
blanchet@34121	466
blanchet@33191	467	With infinite types, we don't always have the luxury of a genuine counterexample
blanchet@33191	468	and must often content ourselves with a potential one. The tedious task of
blanchet@33191	469	finding out whether the potential counterexample is in fact genuine can be
blanchet@34121	470	outsourced to \textit{auto} by passing \textit{check\_potential}. For example:
blanchet@33191	471
blanchet@33191	472	\prew
blanchet@33191	473	\textbf{lemma} ``$\forall n.\; \textit{Suc}~n \mathbin{\not=} n \,\Longrightarrow\, P$'' \\
blanchet@34121	474	\textbf{nitpick} [\textit{card~nat}~= 100, \textit{check\_potential}] \\[2\smallskipamount]
blanchet@33191	475	\slshape Nitpick found a potential counterexample: \\[2\smallskipamount]
blanchet@33191	476	\hbox{}\qquad Free variable: \nopagebreak \\
blanchet@33191	477	\hbox{}\qquad\qquad $P = \textit{False}$ \\[2\smallskipamount]
blanchet@33191	478	Confirmation by ``\textit{auto}'': The above counterexample is genuine.
blanchet@33191	479	\postw
blanchet@33191	480
blanchet@33191	481	You might wonder why the counterexample is first reported as potential. The root
blanchet@33191	482	of the problem is that the bound variable in $\forall n.\; \textit{Suc}~n
blanchet@33191	483	\mathbin{\not=} n$ ranges over an infinite type. If Nitpick finds an $n$ such
blanchet@33191	484	that $\textit{Suc}~n \mathbin{=} n$, it evaluates the assumption to
blanchet@33191	485	\textit{False}; but otherwise, it does not know anything about values of $n \ge
blanchet@33191	486	\textit{card~nat}$ and must therefore evaluate the assumption to $\unk$, not
blanchet@33191	487	\textit{True}. Since the assumption can never be satisfied, the putative lemma
blanchet@33191	488	can never be falsified.
blanchet@33191	489
blanchet@33191	490	Incidentally, if you distrust the so-called genuine counterexamples, you can
blanchet@33191	491	enable \textit{check\_\allowbreak genuine} to verify them as well. However, be
blanchet@34121	492	aware that \textit{auto} will usually fail to prove that the counterexample is
blanchet@33191	493	genuine or spurious.
blanchet@33191	494
blanchet@33191	495	Some conjectures involving elementary number theory make Nitpick look like a
blanchet@33191	496	giant with feet of clay:
blanchet@33191	497
blanchet@33191	498	\prew
blanchet@33191	499	\textbf{lemma} ``$P~\textit{Suc}$'' \\
blanchet@33191	500	\textbf{nitpick} [\textit{card} = 1--6] \\[2\smallskipamount]
blanchet@33191	501	\slshape
blanchet@33191	502	Nitpick found no counterexample.
blanchet@33191	503	\postw
blanchet@33191	504
blanchet@34121	505	On any finite set $N$, \textit{Suc} is a partial function; for example, if $N =
blanchet@34121	506	\{0, 1, \ldots, k\}$, then \textit{Suc} is $\{0 \mapsto 1,\, 1 \mapsto 2,\,
blanchet@34121	507	\ldots,\, k \mapsto \unk\}$, which evaluates to $\unk$ when passed as an
blanchet@34121	508	argument to $P$. As a result, $P~\textit{Suc}$ is always $\unk$. The next
blanchet@34121	509	example is similar:
blanchet@33191	510
blanchet@33191	511	\prew
blanchet@33191	512	\textbf{lemma} ``$P~(\textit{op}~{+}\Colon
blanchet@33191	513	\textit{nat}\mathbin{\Rightarrow}\textit{nat}\mathbin{\Rightarrow}\textit{nat})$'' \\
blanchet@33191	514	\textbf{nitpick} [\textit{card nat} = 1] \\[2\smallskipamount]
blanchet@33191	515	{\slshape Nitpick found a counterexample:} \\[2\smallskipamount]
blanchet@33191	516	\hbox{}\qquad Free variable: \nopagebreak \\
blanchet@33191	517	\hbox{}\qquad\qquad $P = \{\}$ \\[2\smallskipamount]
blanchet@33191	518	\textbf{nitpick} [\textit{card nat} = 2] \\[2\smallskipamount]
blanchet@33191	519	{\slshape Nitpick found no counterexample.}
blanchet@33191	520	\postw
blanchet@33191	521
blanchet@33191	522	The problem here is that \textit{op}~+ is total when \textit{nat} is taken to be
blanchet@33191	523	$\{0\}$ but becomes partial as soon as we add $1$, because $1 + 1 \notin \{0,
blanchet@33191	524	1\}$.
blanchet@33191	525
blanchet@33191	526	Because numbers are infinite and are approximated using a three-valued logic,
blanchet@33191	527	there is usually no need to systematically enumerate domain sizes. If Nitpick
blanchet@33191	528	cannot find a genuine counterexample for \textit{card~nat}~= $k$, it is very
blanchet@33191	529	unlikely that one could be found for smaller domains. (The $P~(\textit{op}~{+})$
blanchet@33191	530	example above is an exception to this principle.) Nitpick nonetheless enumerates
blanchet@33191	531	all cardinalities from 1 to 8 for \textit{nat}, mainly because smaller
blanchet@33191	532	cardinalities are fast to handle and give rise to simpler counterexamples. This
blanchet@33191	533	is explained in more detail in \S\ref{scope-monotonicity}.
blanchet@33191	534
blanchet@33191	535	\subsection{Inductive Datatypes}
blanchet@33191	536	\label{inductive-datatypes}
blanchet@33191	537
blanchet@33191	538	Like natural numbers and integers, inductive datatypes with recursive
blanchet@33191	539	constructors admit no finite models and must be approximated by a subterm-closed
blanchet@33191	540	subset. For example, using a cardinality of 10 for ${'}a~\textit{list}$,
blanchet@33191	541	Nitpick looks for all counterexamples that can be built using at most 10
blanchet@33191	542	different lists.
blanchet@33191	543
blanchet@33191	544	Let's see with an example involving \textit{hd} (which returns the first element
blanchet@33191	545	of a list) and $@$ (which concatenates two lists):
blanchet@33191	546
blanchet@33191	547	\prew
blanchet@33191	548	\textbf{lemma} ``$\textit{hd}~(\textit{xs} \mathbin{@} [y, y]) = \textit{hd}~\textit{xs}$'' \\
blanchet@33191	549	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	550	\slshape Nitpick found a counterexample for \textit{card} $'a$~= 3: \\[2\smallskipamount]
blanchet@33191	551	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	552	\hbox{}\qquad\qquad $\textit{xs} = []$ \\
blanchet@33191	553	\hbox{}\qquad\qquad $\textit{y} = a_3$
blanchet@33191	554	\postw
blanchet@33191	555
blanchet@33191	556	To see why the counterexample is genuine, we enable \textit{show\_consts}
blanchet@33191	557	and \textit{show\_\allowbreak datatypes}:
blanchet@33191	558
blanchet@33191	559	\prew
blanchet@33191	560	{\slshape Datatype:} \\
blanchet@33191	561	\hbox{}\qquad $'a$~\textit{list}~= $\{[],\, [a_3, a_3],\, [a_3],\, \unr\}$ \\
blanchet@33191	562	{\slshape Constants:} \\
blanchet@34969	563	\hbox{}\qquad $\lambda x_1.\; x_1 \mathbin{@} [y, y] = \undef([] := [a_3, a_3])$ \\
blanchet@33191	564	\hbox{}\qquad $\textit{hd} = \undef([] := a_2,\> [a_3, a_3] := a_3,\> [a_3] := a_3)$
blanchet@33191	565	\postw
blanchet@33191	566
blanchet@33191	567	Since $\mathit{hd}~[]$ is undefined in the logic, it may be given any value,
blanchet@33191	568	including $a_2$.
blanchet@33191	569
blanchet@33191	570	The second constant, $\lambda x_1.\; x_1 \mathbin{@} [y, y]$, is simply the
blanchet@33191	571	append operator whose second argument is fixed to be $[y, y]$. Appending $[a_3,
blanchet@33191	572	a_3]$ to $[a_3]$ would normally give $[a_3, a_3, a_3]$, but this value is not
blanchet@33191	573	representable in the subset of $'a$~\textit{list} considered by Nitpick, which
blanchet@33191	574	is shown under the ``Datatype'' heading; hence the result is $\unk$. Similarly,
blanchet@33191	575	appending $[a_3, a_3]$ to itself gives $\unk$.
blanchet@33191	576
blanchet@33191	577	Given \textit{card}~$'a = 3$ and \textit{card}~$'a~\textit{list} = 3$, Nitpick
blanchet@33191	578	considers the following subsets:
blanchet@33191	579
blanchet@33191	580	\kern-.5\smallskipamount %% TYPESETTING
blanchet@33191	581
blanchet@33191	582	\prew
blanchet@33191	583	\begin{multicols}{3}
blanchet@33191	584	$\{[],\, [a_1],\, [a_2]\}$; \\
blanchet@33191	585	$\{[],\, [a_1],\, [a_3]\}$; \\
blanchet@33191	586	$\{[],\, [a_2],\, [a_3]\}$; \\
blanchet@33191	587	$\{[],\, [a_1],\, [a_1, a_1]\}$; \\
blanchet@33191	588	$\{[],\, [a_1],\, [a_2, a_1]\}$; \\
blanchet@33191	589	$\{[],\, [a_1],\, [a_3, a_1]\}$; \\
blanchet@33191	590	$\{[],\, [a_2],\, [a_1, a_2]\}$; \\
blanchet@33191	591	$\{[],\, [a_2],\, [a_2, a_2]\}$; \\
blanchet@33191	592	$\{[],\, [a_2],\, [a_3, a_2]\}$; \\
blanchet@33191	593	$\{[],\, [a_3],\, [a_1, a_3]\}$; \\
blanchet@33191	594	$\{[],\, [a_3],\, [a_2, a_3]\}$; \\
blanchet@33191	595	$\{[],\, [a_3],\, [a_3, a_3]\}$.
blanchet@33191	596	\end{multicols}
blanchet@33191	597	\postw
blanchet@33191	598
blanchet@33191	599	\kern-2\smallskipamount %% TYPESETTING
blanchet@33191	600
blanchet@33191	601	All subterm-closed subsets of $'a~\textit{list}$ consisting of three values
blanchet@33191	602	are listed and only those. As an example of a non-subterm-closed subset,
blanchet@33191	603	consider $\mathcal{S} = \{[],\, [a_1],\,\allowbreak [a_1, a_3]\}$, and observe
blanchet@33191	604	that $[a_1, a_3]$ (i.e., $a_1 \mathbin{\#} [a_3]$) has $[a_3] \notin
blanchet@33191	605	\mathcal{S}$ as a subterm.
blanchet@33191	606
blanchet@33191	607	Here's another m\"ochtegern-lemma that Nitpick can refute without a blink:
blanchet@33191	608
blanchet@33191	609	\prew
blanchet@33191	610	\textbf{lemma} ``$\lbrakk \textit{length}~\textit{xs} = 1;\> \textit{length}~\textit{ys} = 1
blanchet@33191	611	\rbrakk \,\Longrightarrow\, \textit{xs} = \textit{ys}$''
blanchet@33191	612	\\
blanchet@33191	613	\textbf{nitpick} [\textit{show\_datatypes}] \\[2\smallskipamount]
blanchet@33191	614	\slshape Nitpick found a counterexample for \textit{card} $'a$~= 3: \\[2\smallskipamount]
blanchet@33191	615	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	616	\hbox{}\qquad\qquad $\textit{xs} = [a_2]$ \\
blanchet@33191	617	\hbox{}\qquad\qquad $\textit{ys} = [a_3]$ \\
blanchet@33191	618	\hbox{}\qquad Datatypes: \\
blanchet@33191	619	\hbox{}\qquad\qquad $\textit{nat} = \{0,\, 1,\, 2,\, \unr\}$ \\
blanchet@33191	620	\hbox{}\qquad\qquad $'a$~\textit{list} = $\{[],\, [a_3],\, [a_2],\, \unr\}$
blanchet@33191	621	\postw
blanchet@33191	622
blanchet@33191	623	Because datatypes are approximated using a three-valued logic, there is usually
blanchet@33191	624	no need to systematically enumerate cardinalities: If Nitpick cannot find a
blanchet@33191	625	genuine counterexample for \textit{card}~$'a~\textit{list}$~= 10, it is very
blanchet@33191	626	unlikely that one could be found for smaller cardinalities.
blanchet@33191	627
blanchet@33191	628	\subsection{Typedefs, Records, Rationals, and Reals}
blanchet@33191	629	\label{typedefs-records-rationals-and-reals}
blanchet@33191	630
blanchet@33191	631	Nitpick generally treats types declared using \textbf{typedef} as datatypes
blanchet@33191	632	whose single constructor is the corresponding \textit{Abs\_\kern.1ex} function.
blanchet@33191	633	For example:
blanchet@33191	634
blanchet@33191	635	\prew
blanchet@33191	636	\textbf{typedef}~\textit{three} = ``$\{0\Colon\textit{nat},\, 1,\, 2\}$'' \\
blanchet@33191	637	\textbf{by}~\textit{blast} \\[2\smallskipamount]
blanchet@33191	638	\textbf{definition}~$A \mathbin{\Colon} \textit{three}$ \textbf{where} ``\kern-.1em$A \,\equiv\, \textit{Abs\_\allowbreak three}~0$'' \\
blanchet@33191	639	\textbf{definition}~$B \mathbin{\Colon} \textit{three}$ \textbf{where} ``$B \,\equiv\, \textit{Abs\_three}~1$'' \\
blanchet@33191	640	\textbf{definition}~$C \mathbin{\Colon} \textit{three}$ \textbf{where} ``$C \,\equiv\, \textit{Abs\_three}~2$'' \\[2\smallskipamount]
blanchet@33191	641	\textbf{lemma} ``$\lbrakk P~A;\> P~B\rbrakk \,\Longrightarrow\, P~x$'' \\
blanchet@33191	642	\textbf{nitpick} [\textit{show\_datatypes}] \\[2\smallskipamount]
blanchet@33191	643	\slshape Nitpick found a counterexample: \\[2\smallskipamount]
blanchet@33191	644	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	645	\hbox{}\qquad\qquad $P = \{\Abs{1},\, \Abs{0}\}$ \\
blanchet@33191	646	\hbox{}\qquad\qquad $x = \Abs{2}$ \\
blanchet@33191	647	\hbox{}\qquad Datatypes: \\
blanchet@33191	648	\hbox{}\qquad\qquad $\textit{nat} = \{0,\, 1,\, 2,\, \unr\}$ \\
blanchet@33191	649	\hbox{}\qquad\qquad $\textit{three} = \{\Abs{2},\, \Abs{1},\, \Abs{0},\, \unr\}$
blanchet@33191	650	\postw
blanchet@33191	651
blanchet@33191	652	%% MARK
blanchet@33191	653	In the output above, $\Abs{n}$ abbreviates $\textit{Abs\_three}~n$.
blanchet@33191	654
blanchet@33191	655	%% MARK
blanchet@33191	656	Records, which are implemented as \textbf{typedef}s behind the scenes, are
blanchet@33191	657	handled in much the same way:
blanchet@33191	658
blanchet@33191	659	\prew
blanchet@33191	660	\textbf{record} \textit{point} = \\
blanchet@33191	661	\hbox{}\quad $\textit{Xcoord} \mathbin{\Colon} \textit{int}$ \\
blanchet@33191	662	\hbox{}\quad $\textit{Ycoord} \mathbin{\Colon} \textit{int}$ \\[2\smallskipamount]
blanchet@33191	663	\textbf{lemma} ``$\textit{Xcoord}~(p\Colon\textit{point}) = \textit{Xcoord}~(q\Colon\textit{point})$'' \\
blanchet@33191	664	\textbf{nitpick} [\textit{show\_datatypes}] \\[2\smallskipamount]
blanchet@33191	665	\slshape Nitpick found a counterexample: \\[2\smallskipamount]
blanchet@33191	666	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	667	\hbox{}\qquad\qquad $p = \lparr\textit{Xcoord} = 0,\> \textit{Ycoord} = 0\rparr$ \\
blanchet@33191	668	\hbox{}\qquad\qquad $q = \lparr\textit{Xcoord} = 1,\> \textit{Ycoord} = 1\rparr$ \\
blanchet@33191	669	\hbox{}\qquad Datatypes: \\
blanchet@33191	670	\hbox{}\qquad\qquad $\textit{int} = \{0,\, 1,\, \unr\}$ \\
blanchet@33191	671	\hbox{}\qquad\qquad $\textit{point} = \{\lparr\textit{Xcoord} = 1,\>
blanchet@33191	672	\textit{Ycoord} = 1\rparr,\> \lparr\textit{Xcoord} = 0,\> \textit{Ycoord} = 0\rparr,\, \unr\}$\kern-1pt %% QUIET
blanchet@33191	673	\postw
blanchet@33191	674
blanchet@33191	675	Finally, Nitpick provides rudimentary support for rationals and reals using a
blanchet@33191	676	similar approach:
blanchet@33191	677
blanchet@33191	678	\prew
blanchet@33191	679	\textbf{lemma} ``$4 * x + 3 * (y\Colon\textit{real}) \not= 1/2$'' \\
blanchet@33191	680	\textbf{nitpick} [\textit{show\_datatypes}] \\[2\smallskipamount]
blanchet@33191	681	\slshape Nitpick found a counterexample: \\[2\smallskipamount]
blanchet@33191	682	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	683	\hbox{}\qquad\qquad $x = 1/2$ \\
blanchet@33191	684	\hbox{}\qquad\qquad $y = -1/2$ \\
blanchet@33191	685	\hbox{}\qquad Datatypes: \\
blanchet@33191	686	\hbox{}\qquad\qquad $\textit{nat} = \{0,\, 1,\, 2,\, 3,\, 4,\, 5,\, 6,\, 7,\, \unr\}$ \\
blanchet@33191	687	\hbox{}\qquad\qquad $\textit{int} = \{0,\, 1,\, 2,\, 3,\, 4,\, -3,\, -2,\, -1,\, \unr\}$ \\
blanchet@33191	688	\hbox{}\qquad\qquad $\textit{real} = \{1,\, 0,\, 4,\, -3/2,\, 3,\, 2,\, 1/2,\, -1/2,\, \unr\}$
blanchet@33191	689	\postw
blanchet@33191	690
blanchet@33191	691	\subsection{Inductive and Coinductive Predicates}
blanchet@33191	692	\label{inductive-and-coinductive-predicates}
blanchet@33191	693
blanchet@33191	694	Inductively defined predicates (and sets) are particularly problematic for
blanchet@33191	695	counterexample generators. They can make Quickcheck~\cite{berghofer-nipkow-2004}
blanchet@33191	696	loop forever and Refute~\cite{weber-2008} run out of resources. The crux of
blanchet@33191	697	the problem is that they are defined using a least fixed point construction.
blanchet@33191	698
blanchet@33191	699	Nitpick's philosophy is that not all inductive predicates are equal. Consider
blanchet@33191	700	the \textit{even} predicate below:
blanchet@33191	701
blanchet@33191	702	\prew
blanchet@33191	703	\textbf{inductive}~\textit{even}~\textbf{where} \\
blanchet@33191	704	``\textit{even}~0'' $\,\mid$ \\
blanchet@33191	705	``\textit{even}~$n\,\Longrightarrow\, \textit{even}~(\textit{Suc}~(\textit{Suc}~n))$''
blanchet@33191	706	\postw
blanchet@33191	707
blanchet@33191	708	This predicate enjoys the desirable property of being well-founded, which means
blanchet@33191	709	that the introduction rules don't give rise to infinite chains of the form
blanchet@33191	710
blanchet@33191	711	\prew
blanchet@33191	712	$\cdots\,\Longrightarrow\, \textit{even}~k''
blanchet@33191	713	\,\Longrightarrow\, \textit{even}~k'
blanchet@33191	714	\,\Longrightarrow\, \textit{even}~k.$
blanchet@33191	715	\postw
blanchet@33191	716
blanchet@33191	717	For \textit{even}, this is obvious: Any chain ending at $k$ will be of length
blanchet@33191	718	$k/2 + 1$:
blanchet@33191	719
blanchet@33191	720	\prew
blanchet@33191	721	$\textit{even}~0\,\Longrightarrow\, \textit{even}~2\,\Longrightarrow\, \cdots
blanchet@33191	722	\,\Longrightarrow\, \textit{even}~(k - 2)
blanchet@33191	723	\,\Longrightarrow\, \textit{even}~k.$
blanchet@33191	724	\postw
blanchet@33191	725
blanchet@33191	726	Wellfoundedness is desirable because it enables Nitpick to use a very efficient
blanchet@33191	727	fixed point computation.%
blanchet@33191	728	\footnote{If an inductive predicate is
blanchet@33191	729	well-founded, then it has exactly one fixed point, which is simultaneously the
blanchet@33191	730	least and the greatest fixed point. In these circumstances, the computation of
blanchet@33191	731	the least fixed point amounts to the computation of an arbitrary fixed point,
blanchet@33191	732	which can be performed using a straightforward recursive equation.}
blanchet@33191	733	Moreover, Nitpick can prove wellfoundedness of most well-founded predicates,
blanchet@33191	734	just as Isabelle's \textbf{function} package usually discharges termination
blanchet@33191	735	proof obligations automatically.
blanchet@33191	736
blanchet@33191	737	Let's try an example:
blanchet@33191	738
blanchet@33191	739	\prew
blanchet@33191	740	\textbf{lemma} ``$\exists n.\; \textit{even}~n \mathrel{\land} \textit{even}~(\textit{Suc}~n)$'' \\
blanchet@34123	741	\textbf{nitpick}~[\textit{card nat}~= 100, \textit{unary\_ints}, \textit{verbose}] \\[2\smallskipamount]
blanchet@33191	742	\slshape The inductive predicate ``\textit{even}'' was proved well-founded.
blanchet@33191	743	Nitpick can compute it efficiently. \\[2\smallskipamount]
blanchet@33191	744	Trying 1 scope: \\
blanchet@33191	745	\hbox{}\qquad \textit{card nat}~= 100. \\[2\smallskipamount]
blanchet@33191	746	Nitpick found a potential counterexample for \textit{card nat}~= 100: \\[2\smallskipamount]
blanchet@33191	747	\hbox{}\qquad Empty assignment \\[2\smallskipamount]
blanchet@33191	748	Nitpick could not find a better counterexample. \\[2\smallskipamount]
blanchet@33191	749	Total time: 2274 ms.
blanchet@33191	750	\postw
blanchet@33191	751
blanchet@33191	752	No genuine counterexample is possible because Nitpick cannot rule out the
blanchet@33191	753	existence of a natural number $n \ge 100$ such that both $\textit{even}~n$ and
blanchet@33191	754	$\textit{even}~(\textit{Suc}~n)$ are true. To help Nitpick, we can bound the
blanchet@33191	755	existential quantifier:
blanchet@33191	756
blanchet@33191	757	\prew
blanchet@33191	758	\textbf{lemma} ``$\exists n \mathbin{\le} 99.\; \textit{even}~n \mathrel{\land} \textit{even}~(\textit{Suc}~n)$'' \\
blanchet@34123	759	\textbf{nitpick}~[\textit{card nat}~= 100, \textit{unary\_ints}] \\[2\smallskipamount]
blanchet@33191	760	\slshape Nitpick found a counterexample: \\[2\smallskipamount]
blanchet@33191	761	\hbox{}\qquad Empty assignment
blanchet@33191	762	\postw
blanchet@33191	763
blanchet@33191	764	So far we have been blessed by the wellfoundedness of \textit{even}. What happens if
blanchet@33191	765	we use the following definition instead?
blanchet@33191	766
blanchet@33191	767	\prew
blanchet@33191	768	\textbf{inductive} $\textit{even}'$ \textbf{where} \\
blanchet@33191	769	``$\textit{even}'~(0{\Colon}\textit{nat})$'' $\,\mid$ \\
blanchet@33191	770	``$\textit{even}'~2$'' $\,\mid$ \\
blanchet@33191	771	``$\lbrakk\textit{even}'~m;\> \textit{even}'~n\rbrakk \,\Longrightarrow\, \textit{even}'~(m + n)$''
blanchet@33191	772	\postw
blanchet@33191	773
blanchet@33191	774	This definition is not well-founded: From $\textit{even}'~0$ and
blanchet@33191	775	$\textit{even}'~0$, we can derive that $\textit{even}'~0$. Nonetheless, the
blanchet@33191	776	predicates $\textit{even}$ and $\textit{even}'$ are equivalent.
blanchet@33191	777
blanchet@33191	778	Let's check a property involving $\textit{even}'$. To make up for the
blanchet@33191	779	foreseeable computational hurdles entailed by non-wellfoundedness, we decrease
blanchet@33191	780	\textit{nat}'s cardinality to a mere 10:
blanchet@33191	781
blanchet@33191	782	\prew
blanchet@33191	783	\textbf{lemma}~``$\exists n \in \{0, 2, 4, 6, 8\}.\;
blanchet@33191	784	\lnot\;\textit{even}'~n$'' \\
blanchet@33191	785	\textbf{nitpick}~[\textit{card nat}~= 10,\, \textit{verbose},\, \textit{show\_consts}] \\[2\smallskipamount]
blanchet@33191	786	\slshape
blanchet@33191	787	The inductive predicate ``$\textit{even}'\!$'' could not be proved well-founded.
blanchet@33191	788	Nitpick might need to unroll it. \\[2\smallskipamount]
blanchet@33191	789	Trying 6 scopes: \\
blanchet@33191	790	\hbox{}\qquad \textit{card nat}~= 10 and \textit{iter} $\textit{even}'$~= 0; \\
blanchet@33191	791	\hbox{}\qquad \textit{card nat}~= 10 and \textit{iter} $\textit{even}'$~= 1; \\
blanchet@33191	792	\hbox{}\qquad \textit{card nat}~= 10 and \textit{iter} $\textit{even}'$~= 2; \\
blanchet@33191	793	\hbox{}\qquad \textit{card nat}~= 10 and \textit{iter} $\textit{even}'$~= 4; \\
blanchet@33191	794	\hbox{}\qquad \textit{card nat}~= 10 and \textit{iter} $\textit{even}'$~= 8; \\
blanchet@33191	795	\hbox{}\qquad \textit{card nat}~= 10 and \textit{iter} $\textit{even}'$~= 9. \\[2\smallskipamount]
blanchet@33191	796	Nitpick found a counterexample for \textit{card nat}~= 10 and \textit{iter} $\textit{even}'$~= 2: \\[2\smallskipamount]
blanchet@33191	797	\hbox{}\qquad Constant: \nopagebreak \\
blanchet@33191	798	\hbox{}\qquad\qquad $\lambda i.\; \textit{even}'$ = $\undef(\!\begin{aligned}[t]
blanchet@33191	799	& 2 := \{0, 2, 4, 6, 8, 1^\Q, 3^\Q, 5^\Q, 7^\Q, 9^\Q\}, \\[-2pt]
blanchet@33191	800	& 1 := \{0, 2, 4, 1^\Q, 3^\Q, 5^\Q, 6^\Q, 7^\Q, 8^\Q, 9^\Q\}, \\[-2pt]
blanchet@33191	801	& 0 := \{0, 2, 1^\Q, 3^\Q, 4^\Q, 5^\Q, 6^\Q, 7^\Q, 8^\Q, 9^\Q\})\end{aligned}$ \\[2\smallskipamount]
blanchet@33191	802	Total time: 1140 ms.
blanchet@33191	803	\postw
blanchet@33191	804
blanchet@33191	805	Nitpick's output is very instructive. First, it tells us that the predicate is
blanchet@33191	806	unrolled, meaning that it is computed iteratively from the empty set. Then it
blanchet@33191	807	lists six scopes specifying different bounds on the numbers of iterations:\ 0,
blanchet@33191	808	1, 2, 4, 8, and~9.
blanchet@33191	809
blanchet@33191	810	The output also shows how each iteration contributes to $\textit{even}'$. The
blanchet@33191	811	notation $\lambda i.\; \textit{even}'$ indicates that the value of the
blanchet@33191	812	predicate depends on an iteration counter. Iteration 0 provides the basis
blanchet@33191	813	elements, $0$ and $2$. Iteration 1 contributes $4$ ($= 2 + 2$). Iteration 2
blanchet@33191	814	throws $6$ ($= 2 + 4 = 4 + 2$) and $8$ ($= 4 + 4$) into the mix. Further
blanchet@33191	815	iterations would not contribute any new elements.
blanchet@33191	816
blanchet@33191	817	Some values are marked with superscripted question
blanchet@33191	818	marks~(`\lower.2ex\hbox{$^\Q$}'). These are the elements for which the
blanchet@33191	819	predicate evaluates to $\unk$. Thus, $\textit{even}'$ evaluates to either
blanchet@33191	820	\textit{True} or $\unk$, never \textit{False}.
blanchet@33191	821
blanchet@33191	822	When unrolling a predicate, Nitpick tries 0, 1, 2, 4, 8, 12, 16, and 24
blanchet@33191	823	iterations. However, these numbers are bounded by the cardinality of the
blanchet@33191	824	predicate's domain. With \textit{card~nat}~= 10, no more than 9 iterations are
blanchet@33191	825	ever needed to compute the value of a \textit{nat} predicate. You can specify
blanchet@33191	826	the number of iterations using the \textit{iter} option, as explained in
blanchet@33191	827	\S\ref{scope-of-search}.
blanchet@33191	828
blanchet@33191	829	In the next formula, $\textit{even}'$ occurs both positively and negatively:
blanchet@33191	830
blanchet@33191	831	\prew
blanchet@33191	832	\textbf{lemma} ``$\textit{even}'~(n - 2) \,\Longrightarrow\, \textit{even}'~n$'' \\
blanchet@34121	833	\textbf{nitpick} [\textit{card nat} = 10, \textit{show\_consts}] \\[2\smallskipamount]
blanchet@33191	834	\slshape Nitpick found a counterexample: \\[2\smallskipamount]
blanchet@33191	835	\hbox{}\qquad Free variable: \nopagebreak \\
blanchet@33191	836	\hbox{}\qquad\qquad $n = 1$ \\
blanchet@33191	837	\hbox{}\qquad Constants: \nopagebreak \\
blanchet@33191	838	\hbox{}\qquad\qquad $\lambda i.\; \textit{even}'$ = $\undef(\!\begin{aligned}[t]
blanchet@33191	839	& 0 := \{0, 2, 1^\Q, 3^\Q, 4^\Q, 5^\Q, 6^\Q, 7^\Q, 8^\Q, 9^\Q\})\end{aligned}$ \\
blanchet@33191	840	\hbox{}\qquad\qquad $\textit{even}' \subseteq \{0, 2, 4, 6, 8, \unr\}$
blanchet@33191	841	\postw
blanchet@33191	842
blanchet@33191	843	Notice the special constraint $\textit{even}' \subseteq \{0,\, 2,\, 4,\, 6,\,
blanchet@33191	844	8,\, \unr\}$ in the output, whose right-hand side represents an arbitrary
blanchet@33191	845	fixed point (not necessarily the least one). It is used to falsify
blanchet@33191	846	$\textit{even}'~n$. In contrast, the unrolled predicate is used to satisfy
blanchet@33191	847	$\textit{even}'~(n - 2)$.
blanchet@33191	848
blanchet@33191	849	Coinductive predicates are handled dually. For example:
blanchet@33191	850
blanchet@33191	851	\prew
blanchet@33191	852	\textbf{coinductive} \textit{nats} \textbf{where} \\
blanchet@33191	853	``$\textit{nats}~(x\Colon\textit{nat}) \,\Longrightarrow\, \textit{nats}~x$'' \\[2\smallskipamount]
blanchet@33191	854	\textbf{lemma} ``$\textit{nats} = \{0, 1, 2, 3, 4\}$'' \\
blanchet@33191	855	\textbf{nitpick}~[\textit{card nat} = 10,\, \textit{show\_consts}] \\[2\smallskipamount]
blanchet@33191	856	\slshape Nitpick found a counterexample:
blanchet@33191	857	\\[2\smallskipamount]
blanchet@33191	858	\hbox{}\qquad Constants: \nopagebreak \\
blanchet@33191	859	\hbox{}\qquad\qquad $\lambda i.\; \textit{nats} = \undef(0 := \{\!\begin{aligned}[t]
blanchet@33191	860	& 0^\Q, 1^\Q, 2^\Q, 3^\Q, 4^\Q, 5^\Q, 6^\Q, 7^\Q, 8^\Q, 9^\Q, \\[-2pt]
blanchet@33191	861	& \unr\})\end{aligned}$ \\
blanchet@33191	862	\hbox{}\qquad\qquad $\textit{nats} \supseteq \{9, 5^\Q, 6^\Q, 7^\Q, 8^\Q, \unr\}$
blanchet@33191	863	\postw
blanchet@33191	864
blanchet@33191	865	As a special case, Nitpick uses Kodkod's transitive closure operator to encode
blanchet@33191	866	negative occurrences of non-well-founded ``linear inductive predicates,'' i.e.,
blanchet@33191	867	inductive predicates for which the predicate occurs in at most one
blanchet@33191	868	assumption of each introduction rule. For example:
blanchet@33191	869
blanchet@33191	870	\prew
blanchet@33191	871	\textbf{inductive} \textit{odd} \textbf{where} \\
blanchet@33191	872	``$\textit{odd}~1$'' $\,\mid$ \\
blanchet@33191	873	``$\lbrakk \textit{odd}~m;\>\, \textit{even}~n\rbrakk \,\Longrightarrow\, \textit{odd}~(m + n)$'' \\[2\smallskipamount]
blanchet@33191	874	\textbf{lemma}~``$\textit{odd}~n \,\Longrightarrow\, \textit{odd}~(n - 2)$'' \\
blanchet@33191	875	\textbf{nitpick}~[\textit{card nat} = 10,\, \textit{show\_consts}] \\[2\smallskipamount]
blanchet@33191	876	\slshape Nitpick found a counterexample:
blanchet@33191	877	\\[2\smallskipamount]
blanchet@33191	878	\hbox{}\qquad Free variable: \nopagebreak \\
blanchet@33191	879	\hbox{}\qquad\qquad $n = 1$ \\
blanchet@33191	880	\hbox{}\qquad Constants: \nopagebreak \\
blanchet@33191	881	\hbox{}\qquad\qquad $\textit{even} = \{0, 2, 4, 6, 8, \unr\}$ \\
blanchet@33191	882	\hbox{}\qquad\qquad $\textit{odd}_{\textsl{base}} = \{1, \unr\}$ \\
blanchet@33191	883	\hbox{}\qquad\qquad $\textit{odd}_{\textsl{step}} = \!
blanchet@33191	884	\!\begin{aligned}[t]
blanchet@33191	885	& \{(0, 0), (0, 2), (0, 4), (0, 6), (0, 8), (1, 1), (1, 3), (1, 5), \\[-2pt]
blanchet@33191	886	& \phantom{\{} (1, 7), (1, 9), (2, 2), (2, 4), (2, 6), (2, 8), (3, 3),
blanchet@33191	887	(3, 5), \\[-2pt]
blanchet@33191	888	& \phantom{\{} (3, 7), (3, 9), (4, 4), (4, 6), (4, 8), (5, 5), (5, 7), (5, 9), \\[-2pt]
blanchet@33191	889	& \phantom{\{} (6, 6), (6, 8), (7, 7), (7, 9), (8, 8), (9, 9), \unr\}\end{aligned}$ \\
blanchet@33191	890	\hbox{}\qquad\qquad $\textit{odd} \subseteq \{1, 3, 5, 7, 9, 8^\Q, \unr\}$
blanchet@33191	891	\postw
blanchet@33191	892
blanchet@33191	893	\noindent
blanchet@33191	894	In the output, $\textit{odd}_{\textrm{base}}$ represents the base elements and
blanchet@33191	895	$\textit{odd}_{\textrm{step}}$ is a transition relation that computes new
blanchet@33191	896	elements from known ones. The set $\textit{odd}$ consists of all the values
blanchet@33191	897	reachable through the reflexive transitive closure of
blanchet@33191	898	$\textit{odd}_{\textrm{step}}$ starting with any element from
blanchet@33191	899	$\textit{odd}_{\textrm{base}}$, namely 1, 3, 5, 7, and 9. Using Kodkod's
blanchet@33191	900	transitive closure to encode linear predicates is normally either more thorough
blanchet@33191	901	or more efficient than unrolling (depending on the value of \textit{iter}), but
blanchet@33191	902	for those cases where it isn't you can disable it by passing the
blanchet@33191	903	\textit{dont\_star\_linear\_preds} option.
blanchet@33191	904
blanchet@33191	905	\subsection{Coinductive Datatypes}
blanchet@33191	906	\label{coinductive-datatypes}
blanchet@33191	907
blanchet@33191	908	While Isabelle regrettably lacks a high-level mechanism for defining coinductive
blanchet@33191	909	datatypes, the \textit{Coinductive\_List} theory provides a coinductive ``lazy
blanchet@33191	910	list'' datatype, $'a~\textit{llist}$, defined the hard way. Nitpick supports
blanchet@33191	911	these lazy lists seamlessly and provides a hook, described in
blanchet@33191	912	\S\ref{registration-of-coinductive-datatypes}, to register custom coinductive
blanchet@33191	913	datatypes.
blanchet@33191	914
blanchet@33191	915	(Co)intuitively, a coinductive datatype is similar to an inductive datatype but
blanchet@33191	916	allows infinite objects. Thus, the infinite lists $\textit{ps}$ $=$ $[a, a, a,
blanchet@33191	917	\ldots]$, $\textit{qs}$ $=$ $[a, b, a, b, \ldots]$, and $\textit{rs}$ $=$ $[0,
blanchet@33191	918	1, 2, 3, \ldots]$ can be defined as lazy lists using the
blanchet@33191	919	$\textit{LNil}\mathbin{\Colon}{'}a~\textit{llist}$ and
blanchet@33191	920	$\textit{LCons}\mathbin{\Colon}{'}a \mathbin{\Rightarrow} {'}a~\textit{llist}
blanchet@33191	921	\mathbin{\Rightarrow} {'}a~\textit{llist}$ constructors.
blanchet@33191	922
blanchet@33191	923	Although it is otherwise no friend of infinity, Nitpick can find counterexamples
blanchet@33191	924	involving cyclic lists such as \textit{ps} and \textit{qs} above as well as
blanchet@33191	925	finite lists:
blanchet@33191	926
blanchet@33191	927	\prew
blanchet@33191	928	\textbf{lemma} ``$\textit{xs} \not= \textit{LCons}~a~\textit{xs}$'' \\
blanchet@33191	929	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	930	\slshape Nitpick found a counterexample for {\itshape card}~$'a$ = 1: \\[2\smallskipamount]
blanchet@33191	931	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	932	\hbox{}\qquad\qquad $\textit{a} = a_1$ \\
blanchet@33191	933	\hbox{}\qquad\qquad $\textit{xs} = \textsl{THE}~\omega.\; \omega = \textit{LCons}~a_1~\omega$
blanchet@33191	934	\postw
blanchet@33191	935
blanchet@33191	936	The notation $\textrm{THE}~\omega.\; \omega = t(\omega)$ stands
blanchet@33191	937	for the infinite term $t(t(t(\ldots)))$. Hence, \textit{xs} is simply the
blanchet@33191	938	infinite list $[a_1, a_1, a_1, \ldots]$.
blanchet@33191	939
blanchet@33191	940	The next example is more interesting:
blanchet@33191	941
blanchet@33191	942	\prew
blanchet@33191	943	\textbf{lemma}~``$\lbrakk\textit{xs} = \textit{LCons}~a~\textit{xs};\>\,
blanchet@33191	944	\textit{ys} = \textit{iterates}~(\lambda b.\> a)~b\rbrakk \,\Longrightarrow\, \textit{xs} = \textit{ys}$'' \\
blanchet@33191	945	\textbf{nitpick} [\textit{verbose}] \\[2\smallskipamount]
blanchet@33191	946	\slshape The type ``\kern1pt$'a$'' passed the monotonicity test. Nitpick might be able to skip
blanchet@33191	947	some scopes. \\[2\smallskipamount]
blanchet@33191	948	Trying 8 scopes: \\
blanchet@33191	949	\hbox{}\qquad \textit{card} $'a$~= 1, \textit{card} ``\kern1pt$'a~\textit{llist}$''~= 1,
blanchet@33191	950	and \textit{bisim\_depth}~= 0. \\
blanchet@33191	951	\hbox{}\qquad $\qquad\vdots$ \\[.5\smallskipamount]
blanchet@33191	952	\hbox{}\qquad \textit{card} $'a$~= 8, \textit{card} ``\kern1pt$'a~\textit{llist}$''~= 8,
blanchet@33191	953	and \textit{bisim\_depth}~= 7. \\[2\smallskipamount]
blanchet@33191	954	Nitpick found a counterexample for {\itshape card}~$'a$ = 2,
blanchet@33191	955	\textit{card}~``\kern1pt$'a~\textit{llist}$''~= 2, and \textit{bisim\_\allowbreak
blanchet@33191	956	depth}~= 1:
blanchet@33191	957	\\[2\smallskipamount]
blanchet@33191	958	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	959	\hbox{}\qquad\qquad $\textit{a} = a_2$ \\
blanchet@33191	960	\hbox{}\qquad\qquad $\textit{b} = a_1$ \\
blanchet@33191	961	\hbox{}\qquad\qquad $\textit{xs} = \textsl{THE}~\omega.\; \omega = \textit{LCons}~a_2~\omega$ \\
blanchet@33191	962	\hbox{}\qquad\qquad $\textit{ys} = \textit{LCons}~a_1~(\textsl{THE}~\omega.\; \omega = \textit{LCons}~a_2~\omega)$ \\[2\smallskipamount]
blanchet@33191	963	Total time: 726 ms.
blanchet@33191	964	\postw
blanchet@33191	965
blanchet@33191	966	The lazy list $\textit{xs}$ is simply $[a_2, a_2, a_2, \ldots]$, whereas
blanchet@33191	967	$\textit{ys}$ is $[a_1, a_2, a_2, a_2, \ldots]$, i.e., a lasso-shaped list with
blanchet@33191	968	$[a_1]$ as its stem and $[a_2]$ as its cycle. In general, the list segment
blanchet@33191	969	within the scope of the {THE} binder corresponds to the lasso's cycle, whereas
blanchet@33191	970	the segment leading to the binder is the stem.
blanchet@33191	971
blanchet@33191	972	A salient property of coinductive datatypes is that two objects are considered
blanchet@33191	973	equal if and only if they lead to the same observations. For example, the lazy
blanchet@33191	974	lists $\textrm{THE}~\omega.\; \omega =
blanchet@33191	975	\textit{LCons}~a~(\textit{LCons}~b~\omega)$ and
blanchet@33191	976	$\textit{LCons}~a~(\textrm{THE}~\omega.\; \omega =
blanchet@33191	977	\textit{LCons}~b~(\textit{LCons}~a~\omega))$ are identical, because both lead
blanchet@33191	978	to the sequence of observations $a$, $b$, $a$, $b$, \hbox{\ldots} (or,
blanchet@33191	979	equivalently, both encode the infinite list $[a, b, a, b, \ldots]$). This
blanchet@33191	980	concept of equality for coinductive datatypes is called bisimulation and is
blanchet@33191	981	defined coinductively.
blanchet@33191	982
blanchet@33191	983	Internally, Nitpick encodes the coinductive bisimilarity predicate as part of
blanchet@33191	984	the Kodkod problem to ensure that distinct objects lead to different
blanchet@33191	985	observations. This precaution is somewhat expensive and often unnecessary, so it
blanchet@33191	986	can be disabled by setting the \textit{bisim\_depth} option to $-1$. The
blanchet@33191	987	bisimilarity check is then performed \textsl{after} the counterexample has been
blanchet@33191	988	found to ensure correctness. If this after-the-fact check fails, the
blanchet@33191	989	counterexample is tagged as ``likely genuine'' and Nitpick recommends trying
blanchet@33191	990	again with \textit{bisim\_depth} set to a nonnegative integer. Disabling the
blanchet@33191	991	check for the previous example saves approximately 150~milli\-seconds; the speed
blanchet@33191	992	gains can be more significant for larger scopes.
blanchet@33191	993
blanchet@33191	994	The next formula illustrates the need for bisimilarity (either as a Kodkod
blanchet@33191	995	predicate or as an after-the-fact check) to prevent spurious counterexamples:
blanchet@33191	996
blanchet@33191	997	\prew
blanchet@33191	998	\textbf{lemma} ``$\lbrakk \textit{xs} = \textit{LCons}~a~\textit{xs};\>\, \textit{ys} = \textit{LCons}~a~\textit{ys}\rbrakk
blanchet@33191	999	\,\Longrightarrow\, \textit{xs} = \textit{ys}$'' \\
blanchet@34121	1000	\textbf{nitpick} [\textit{bisim\_depth} = $-1$, \textit{show\_datatypes}] \\[2\smallskipamount]
blanchet@33191	1001	\slshape Nitpick found a likely genuine counterexample for $\textit{card}~'a$ = 2: \\[2\smallskipamount]
blanchet@33191	1002	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	1003	\hbox{}\qquad\qquad $a = a_2$ \\
blanchet@33191	1004	\hbox{}\qquad\qquad $\textit{xs} = \textsl{THE}~\omega.\; \omega =
blanchet@33191	1005	\textit{LCons}~a_2~\omega$ \\
blanchet@33191	1006	\hbox{}\qquad\qquad $\textit{ys} = \textsl{THE}~\omega.\; \omega = \textit{LCons}~a_2~\omega$ \\
blanchet@33191	1007	\hbox{}\qquad Codatatype:\strut \nopagebreak \\
blanchet@33191	1008	\hbox{}\qquad\qquad $'a~\textit{llist} =
blanchet@33191	1009	\{\!\begin{aligned}[t]
blanchet@33191	1010	& \textsl{THE}~\omega.\; \omega = \textit{LCons}~a_2~\omega, \\[-2pt]
blanchet@33191	1011	& \textsl{THE}~\omega.\; \omega = \textit{LCons}~a_2~\omega,\> \unr\}\end{aligned}$
blanchet@33191	1012	\\[2\smallskipamount]
blanchet@33191	1013	Try again with ``\textit{bisim\_depth}'' set to a nonnegative value to confirm
blanchet@33191	1014	that the counterexample is genuine. \\[2\smallskipamount]
blanchet@33191	1015	{\upshape\textbf{nitpick}} \\[2\smallskipamount]
blanchet@33191	1016	\slshape Nitpick found no counterexample.
blanchet@33191	1017	\postw
blanchet@33191	1018
blanchet@33191	1019	In the first \textbf{nitpick} invocation, the after-the-fact check discovered
blanchet@33191	1020	that the two known elements of type $'a~\textit{llist}$ are bisimilar.
blanchet@33191	1021
blanchet@33191	1022	A compromise between leaving out the bisimilarity predicate from the Kodkod
blanchet@33191	1023	problem and performing the after-the-fact check is to specify a lower
blanchet@33191	1024	nonnegative \textit{bisim\_depth} value than the default one provided by
blanchet@33191	1025	Nitpick. In general, a value of $K$ means that Nitpick will require all lists to
blanchet@33191	1026	be distinguished from each other by their prefixes of length $K$. Be aware that
blanchet@33191	1027	setting $K$ to too low a value can overconstrain Nitpick, preventing it from
blanchet@33191	1028	finding any counterexamples.
blanchet@33191	1029
blanchet@33191	1030	\subsection{Boxing}
blanchet@33191	1031	\label{boxing}
blanchet@33191	1032
blanchet@33191	1033	Nitpick normally maps function and product types directly to the corresponding
blanchet@33191	1034	Kodkod concepts. As a consequence, if $'a$ has cardinality 3 and $'b$ has
blanchet@33191	1035	cardinality 4, then $'a \times {'}b$ has cardinality 12 ($= 4 \times 3$) and $'a
blanchet@33191	1036	\Rightarrow {'}b$ has cardinality 64 ($= 4^3$). In some circumstances, it pays
blanchet@33191	1037	off to treat these types in the same way as plain datatypes, by approximating
blanchet@33191	1038	them by a subset of a given cardinality. This technique is called ``boxing'' and
blanchet@33191	1039	is particularly useful for functions passed as arguments to other functions, for
blanchet@33191	1040	high-arity functions, and for large tuples. Under the hood, boxing involves
blanchet@33191	1041	wrapping occurrences of the types $'a \times {'}b$ and $'a \Rightarrow {'}b$ in
blanchet@33191	1042	isomorphic datatypes, as can be seen by enabling the \textit{debug} option.
blanchet@33191	1043
blanchet@33191	1044	To illustrate boxing, we consider a formalization of $\lambda$-terms represented
blanchet@33191	1045	using de Bruijn's notation:
blanchet@33191	1046
blanchet@33191	1047	\prew
blanchet@33191	1048	\textbf{datatype} \textit{tm} = \textit{Var}~\textit{nat}~$\mid$~\textit{Lam}~\textit{tm} $\mid$ \textit{App~tm~tm}
blanchet@33191	1049	\postw
blanchet@33191	1050
blanchet@33191	1051	The $\textit{lift}~t~k$ function increments all variables with indices greater
blanchet@33191	1052	than or equal to $k$ by one:
blanchet@33191	1053
blanchet@33191	1054	\prew
blanchet@33191	1055	\textbf{primrec} \textit{lift} \textbf{where} \\
blanchet@33191	1056	``$\textit{lift}~(\textit{Var}~j)~k = \textit{Var}~(\textrm{if}~j < k~\textrm{then}~j~\textrm{else}~j + 1)$'' $\mid$ \\
blanchet@33191	1057	``$\textit{lift}~(\textit{Lam}~t)~k = \textit{Lam}~(\textit{lift}~t~(k + 1))$'' $\mid$ \\
blanchet@33191	1058	``$\textit{lift}~(\textit{App}~t~u)~k = \textit{App}~(\textit{lift}~t~k)~(\textit{lift}~u~k)$''
blanchet@33191	1059	\postw
blanchet@33191	1060
blanchet@33191	1061	The $\textit{loose}~t~k$ predicate returns \textit{True} if and only if
blanchet@33191	1062	term $t$ has a loose variable with index $k$ or more:
blanchet@33191	1063
blanchet@33191	1064	\prew
blanchet@33191	1065	\textbf{primrec}~\textit{loose} \textbf{where} \\
blanchet@33191	1066	``$\textit{loose}~(\textit{Var}~j)~k = (j \ge k)$'' $\mid$ \\
blanchet@33191	1067	``$\textit{loose}~(\textit{Lam}~t)~k = \textit{loose}~t~(\textit{Suc}~k)$'' $\mid$ \\
blanchet@33191	1068	``$\textit{loose}~(\textit{App}~t~u)~k = (\textit{loose}~t~k \mathrel{\lor} \textit{loose}~u~k)$''
blanchet@33191	1069	\postw
blanchet@33191	1070
blanchet@33191	1071	Next, the $\textit{subst}~\sigma~t$ function applies the substitution $\sigma$
blanchet@33191	1072	on $t$:
blanchet@33191	1073
blanchet@33191	1074	\prew
blanchet@33191	1075	\textbf{primrec}~\textit{subst} \textbf{where} \\
blanchet@33191	1076	``$\textit{subst}~\sigma~(\textit{Var}~j) = \sigma~j$'' $\mid$ \\
blanchet@33191	1077	``$\textit{subst}~\sigma~(\textit{Lam}~t) = {}$\phantom{''} \\
blanchet@33191	1078	\phantom{``}$\textit{Lam}~(\textit{subst}~(\lambda n.\> \textrm{case}~n~\textrm{of}~0 \Rightarrow \textit{Var}~0 \mid \textit{Suc}~m \Rightarrow \textit{lift}~(\sigma~m)~1)~t)$'' $\mid$ \\
blanchet@33191	1079	``$\textit{subst}~\sigma~(\textit{App}~t~u) = \textit{App}~(\textit{subst}~\sigma~t)~(\textit{subst}~\sigma~u)$''
blanchet@33191	1080	\postw
blanchet@33191	1081
blanchet@33191	1082	A substitution is a function that maps variable indices to terms. Observe that
blanchet@33191	1083	$\sigma$ is a function passed as argument and that Nitpick can't optimize it
blanchet@33191	1084	away, because the recursive call for the \textit{Lam} case involves an altered
blanchet@33191	1085	version. Also notice the \textit{lift} call, which increments the variable
blanchet@33191	1086	indices when moving under a \textit{Lam}.
blanchet@33191	1087
blanchet@33191	1088	A reasonable property to expect of substitution is that it should leave closed
blanchet@33191	1089	terms unchanged. Alas, even this simple property does not hold:
blanchet@33191	1090
blanchet@33191	1091	\pre
blanchet@33191	1092	\textbf{lemma}~``$\lnot\,\textit{loose}~t~0 \,\Longrightarrow\, \textit{subst}~\sigma~t = t$'' \\
blanchet@33191	1093	\textbf{nitpick} [\textit{verbose}] \\[2\smallskipamount]
blanchet@33191	1094	\slshape
blanchet@33191	1095	Trying 8 scopes: \nopagebreak \\
blanchet@33191	1096	\hbox{}\qquad \textit{card~nat}~= 1, \textit{card tm}~= 1, and \textit{card} ``$\textit{nat} \Rightarrow \textit{tm}$'' = 1; \\
blanchet@33191	1097	\hbox{}\qquad \textit{card~nat}~= 2, \textit{card tm}~= 2, and \textit{card} ``$\textit{nat} \Rightarrow \textit{tm}$'' = 2; \\
blanchet@33191	1098	\hbox{}\qquad $\qquad\vdots$ \\[.5\smallskipamount]
blanchet@33191	1099	\hbox{}\qquad \textit{card~nat}~= 8, \textit{card tm}~= 8, and \textit{card} ``$\textit{nat} \Rightarrow \textit{tm}$'' = 8. \\[2\smallskipamount]
blanchet@33191	1100	Nitpick found a counterexample for \textit{card~nat}~= 6, \textit{card~tm}~= 6,
blanchet@33191	1101	and \textit{card}~``$\textit{nat} \Rightarrow \textit{tm}$''~= 6: \\[2\smallskipamount]
blanchet@33191	1102	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	1103	\hbox{}\qquad\qquad $\sigma = \undef(\!\begin{aligned}[t]
blanchet@33191	1104	& 0 := \textit{Var}~0,\>
blanchet@33191	1105	1 := \textit{Var}~0,\>
blanchet@33191	1106	2 := \textit{Var}~0, \\[-2pt]
blanchet@33191	1107	& 3 := \textit{Var}~0,\>
blanchet@33191	1108	4 := \textit{Var}~0,\>
blanchet@33191	1109	5 := \textit{Var}~0)\end{aligned}$ \\
blanchet@33191	1110	\hbox{}\qquad\qquad $t = \textit{Lam}~(\textit{Lam}~(\textit{Var}~1))$ \\[2\smallskipamount]
blanchet@33191	1111	Total time: $4679$ ms.
blanchet@33191	1112	\postw
blanchet@33191	1113
blanchet@33191	1114	Using \textit{eval}, we find out that $\textit{subst}~\sigma~t =
blanchet@33191	1115	\textit{Lam}~(\textit{Lam}~(\textit{Var}~0))$. Using the traditional
blanchet@33191	1116	$\lambda$-term notation, $t$~is
blanchet@33191	1117	$\lambda x\, y.\> x$ whereas $\textit{subst}~\sigma~t$ is $\lambda x\, y.\> y$.
blanchet@33191	1118	The bug is in \textit{subst}: The $\textit{lift}~(\sigma~m)~1$ call should be
blanchet@33191	1119	replaced with $\textit{lift}~(\sigma~m)~0$.
blanchet@33191	1120
blanchet@33191	1121	An interesting aspect of Nitpick's verbose output is that it assigned increasing
blanchet@33191	1122	cardinalities from 1 to 8 to the type $\textit{nat} \Rightarrow \textit{tm}$.
blanchet@33191	1123	For the formula of interest, knowing 6 values of that type was enough to find
blanchet@33191	1124	the counterexample. Without boxing, $46\,656$ ($= 6^6$) values must be
blanchet@33191	1125	considered, a hopeless undertaking:
blanchet@33191	1126
blanchet@33191	1127	\prew
blanchet@33191	1128	\textbf{nitpick} [\textit{dont\_box}] \\[2\smallskipamount]
blanchet@33191	1129	{\slshape Nitpick ran out of time after checking 4 of 8 scopes.}
blanchet@33191	1130	\postw
blanchet@33191	1131
blanchet@33191	1132	{\looseness=-1
blanchet@33191	1133	Boxing can be enabled or disabled globally or on a per-type basis using the
blanchet@33191	1134	\textit{box} option. Moreover, setting the cardinality of a function or
blanchet@33191	1135	product type implicitly enables boxing for that type. Nitpick usually performs
blanchet@33191	1136	reasonable choices about which types should be boxed, but option tweaking
blanchet@33191	1137	sometimes helps.
blanchet@33191	1138
blanchet@33191	1139	}
blanchet@33191	1140
blanchet@33191	1141	\subsection{Scope Monotonicity}
blanchet@33191	1142	\label{scope-monotonicity}
blanchet@33191	1143
blanchet@33191	1144	The \textit{card} option (together with \textit{iter}, \textit{bisim\_depth},
blanchet@33191	1145	and \textit{max}) controls which scopes are actually tested. In general, to
blanchet@33191	1146	exhaust all models below a certain cardinality bound, the number of scopes that
blanchet@33191	1147	Nitpick must consider increases exponentially with the number of type variables
blanchet@33191	1148	(and \textbf{typedecl}'d types) occurring in the formula. Given the default
blanchet@33191	1149	cardinality specification of 1--8, no fewer than $8^4 = 4096$ scopes must be
blanchet@33191	1150	considered for a formula involving $'a$, $'b$, $'c$, and $'d$.
blanchet@33191	1151
blanchet@33191	1152	Fortunately, many formulas exhibit a property called \textsl{scope
blanchet@33191	1153	monotonicity}, meaning that if the formula is falsifiable for a given scope,
blanchet@33191	1154	it is also falsifiable for all larger scopes \cite[p.~165]{jackson-2006}.
blanchet@33191	1155
blanchet@33191	1156	Consider the formula
blanchet@33191	1157
blanchet@33191	1158	\prew
blanchet@33191	1159	\textbf{lemma}~``$\textit{length~xs} = \textit{length~ys} \,\Longrightarrow\, \textit{rev}~(\textit{zip~xs~ys}) = \textit{zip~xs}~(\textit{rev~ys})$''
blanchet@33191	1160	\postw
blanchet@33191	1161
blanchet@33191	1162	where \textit{xs} is of type $'a~\textit{list}$ and \textit{ys} is of type
blanchet@33191	1163	$'b~\textit{list}$. A priori, Nitpick would need to consider 512 scopes to
blanchet@33191	1164	exhaust the specification \textit{card}~= 1--8. However, our intuition tells us
blanchet@33191	1165	that any counterexample found with a small scope would still be a counterexample
blanchet@33191	1166	in a larger scope---by simply ignoring the fresh $'a$ and $'b$ values provided
blanchet@33191	1167	by the larger scope. Nitpick comes to the same conclusion after a careful
blanchet@33191	1168	inspection of the formula and the relevant definitions:
blanchet@33191	1169
blanchet@33191	1170	\prew
blanchet@33191	1171	\textbf{nitpick}~[\textit{verbose}] \\[2\smallskipamount]
blanchet@33191	1172	\slshape
blanchet@33191	1173	The types ``\kern1pt$'a$'' and ``\kern1pt$'b$'' passed the monotonicity test.
blanchet@33191	1174	Nitpick might be able to skip some scopes.
blanchet@33191	1175	\\[2\smallskipamount]
blanchet@33191	1176	Trying 8 scopes: \\
blanchet@33191	1177	\hbox{}\qquad \textit{card} $'a$~= 1, \textit{card} $'b$~= 1,
blanchet@33191	1178	\textit{card} \textit{nat}~= 1, \textit{card} ``$('a \times {'}b)$
blanchet@33191	1179	\textit{list}''~= 1, \\
blanchet@33191	1180	\hbox{}\qquad\quad \textit{card} ``\kern1pt$'a$ \textit{list}''~= 1, and
blanchet@33191	1181	\textit{card} ``\kern1pt$'b$ \textit{list}''~= 1. \\
blanchet@33191	1182	\hbox{}\qquad \textit{card} $'a$~= 2, \textit{card} $'b$~= 2,
blanchet@33191	1183	\textit{card} \textit{nat}~= 2, \textit{card} ``$('a \times {'}b)$
blanchet@33191	1184	\textit{list}''~= 2, \\
blanchet@33191	1185	\hbox{}\qquad\quad \textit{card} ``\kern1pt$'a$ \textit{list}''~= 2, and
blanchet@33191	1186	\textit{card} ``\kern1pt$'b$ \textit{list}''~= 2. \\
blanchet@33191	1187	\hbox{}\qquad $\qquad\vdots$ \\[.5\smallskipamount]
blanchet@33191	1188	\hbox{}\qquad \textit{card} $'a$~= 8, \textit{card} $'b$~= 8,
blanchet@33191	1189	\textit{card} \textit{nat}~= 8, \textit{card} ``$('a \times {'}b)$
blanchet@33191	1190	\textit{list}''~= 8, \\
blanchet@33191	1191	\hbox{}\qquad\quad \textit{card} ``\kern1pt$'a$ \textit{list}''~= 8, and
blanchet@33191	1192	\textit{card} ``\kern1pt$'b$ \textit{list}''~= 8.
blanchet@33191	1193	\\[2\smallskipamount]
blanchet@33191	1194	Nitpick found a counterexample for
blanchet@33191	1195	\textit{card} $'a$~= 5, \textit{card} $'b$~= 5,
blanchet@33191	1196	\textit{card} \textit{nat}~= 5, \textit{card} ``$('a \times {'}b)$
blanchet@33191	1197	\textit{list}''~= 5, \textit{card} ``\kern1pt$'a$ \textit{list}''~= 5, and
blanchet@33191	1198	\textit{card} ``\kern1pt$'b$ \textit{list}''~= 5:
blanchet@33191	1199	\\[2\smallskipamount]
blanchet@33191	1200	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	1201	\hbox{}\qquad\qquad $\textit{xs} = [a_4, a_5]$ \\
blanchet@33191	1202	\hbox{}\qquad\qquad $\textit{ys} = [b_3, b_3]$ \\[2\smallskipamount]
blanchet@33191	1203	Total time: 1636 ms.
blanchet@33191	1204	\postw
blanchet@33191	1205
blanchet@33191	1206	In theory, it should be sufficient to test a single scope:
blanchet@33191	1207
blanchet@33191	1208	\prew
blanchet@33191	1209	\textbf{nitpick}~[\textit{card}~= 8]
blanchet@33191	1210	\postw
blanchet@33191	1211
blanchet@33191	1212	However, this is often less efficient in practice and may lead to overly complex
blanchet@33191	1213	counterexamples.
blanchet@33191	1214
blanchet@33191	1215	If the monotonicity check fails but we believe that the formula is monotonic (or
blanchet@33191	1216	we don't mind missing some counterexamples), we can pass the
blanchet@33191	1217	\textit{mono} option. To convince yourself that this option is risky,
blanchet@33191	1218	simply consider this example from \S\ref{skolemization}:
blanchet@33191	1219
blanchet@33191	1220	\prew
blanchet@33191	1221	\textbf{lemma} ``$\exists g.\; \forall x\Colon 'b.~g~(f~x) = x
blanchet@33191	1222	\,\Longrightarrow\, \forall y\Colon {'}a.\; \exists x.~y = f~x$'' \\
blanchet@33191	1223	\textbf{nitpick} [\textit{mono}] \\[2\smallskipamount]
blanchet@33191	1224	{\slshape Nitpick found no counterexample.} \\[2\smallskipamount]
blanchet@33191	1225	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	1226	\slshape
blanchet@33191	1227	Nitpick found a counterexample for \textit{card} $'a$~= 2 and \textit{card} $'b$~=~1: \\
blanchet@33191	1228	\hbox{}\qquad $\vdots$
blanchet@33191	1229	\postw
blanchet@33191	1230
blanchet@33191	1231	(It turns out the formula holds if and only if $\textit{card}~'a \le
blanchet@33191	1232	\textit{card}~'b$.) Although this is rarely advisable, the automatic
blanchet@33191	1233	monotonicity checks can be disabled by passing \textit{non\_mono}
blanchet@33191	1234	(\S\ref{optimizations}).
blanchet@33191	1235
blanchet@33191	1236	As insinuated in \S\ref{natural-numbers-and-integers} and
blanchet@33191	1237	\S\ref{inductive-datatypes}, \textit{nat}, \textit{int}, and inductive datatypes
blanchet@33191	1238	are normally monotonic and treated as such. The same is true for record types,
blanchet@33191	1239	\textit{rat}, \textit{real}, and some \textbf{typedef}'d types. Thus, given the
blanchet@33191	1240	cardinality specification 1--8, a formula involving \textit{nat}, \textit{int},
blanchet@33191	1241	\textit{int~list}, \textit{rat}, and \textit{rat~list} will lead Nitpick to
blanchet@33191	1242	consider only 8~scopes instead of $32\,768$.
blanchet@33191	1243
blanchet@34969	1244	\subsection{Inductive Properties}
blanchet@34969	1245	\label{inductive-properties}
blanchet@34969	1246
blanchet@34969	1247	Inductive properties are a particular pain to prove, because the failure to
blanchet@34969	1248	establish an induction step can mean several things:
blanchet@34969	1249	%
blanchet@34969	1250	\begin{enumerate}
blanchet@34969	1251	\item The property is invalid.
blanchet@34969	1252	\item The property is valid but is too weak to support the induction step.
blanchet@34969	1253	\item The property is valid and strong enough; it's just that we haven't found
blanchet@34969	1254	the proof yet.
blanchet@34969	1255	\end{enumerate}
blanchet@34969	1256	%
blanchet@34969	1257	Depending on which scenario applies, we would take the appropriate course of
blanchet@34969	1258	action:
blanchet@34969	1259	%
blanchet@34969	1260	\begin{enumerate}
blanchet@34969	1261	\item Repair the statement of the property so that it becomes valid.
blanchet@34969	1262	\item Generalize the property and/or prove auxiliary properties.
blanchet@34969	1263	\item Work harder on a proof.
blanchet@34969	1264	\end{enumerate}
blanchet@34969	1265	%
blanchet@34969	1266	How can we distinguish between the three scenarios? Nitpick's normal mode of
blanchet@34969	1267	operation can often detect scenario 1, and Isabelle's automatic tactics help with
blanchet@34969	1268	scenario 3. Using appropriate techniques, it is also often possible to use
blanchet@34969	1269	Nitpick to identify scenario 2. Consider the following transition system,
blanchet@34969	1270	in which natural numbers represent states:
blanchet@34969	1271
blanchet@34969	1272	\prew
blanchet@34969	1273	\textbf{inductive\_set}~\textit{reach}~\textbf{where} \\
blanchet@34969	1274	``$(4\Colon\textit{nat}) \in \textit{reach\/}$'' $\mid$ \\
blanchet@34969	1275	``$\lbrakk n < 4;\> n \in \textit{reach\/}\rbrakk \,\Longrightarrow\, 3 * n + 1 \in \textit{reach\/}$'' $\mid$ \\
blanchet@34969	1276	``$n \in \textit{reach} \,\Longrightarrow n + 2 \in \textit{reach\/}$''
blanchet@34969	1277	\postw
blanchet@34969	1278
blanchet@34969	1279	We will try to prove that only even numbers are reachable:
blanchet@34969	1280
blanchet@34969	1281	\prew
blanchet@34969	1282	\textbf{lemma}~``$n \in \textit{reach} \,\Longrightarrow\, 2~\textrm{dvd}~n$''
blanchet@34969	1283	\postw
blanchet@34969	1284
blanchet@34969	1285	Does this property hold? Nitpick cannot find a counterexample within 30 seconds,
blanchet@34969	1286	so let's attempt a proof by induction:
blanchet@34969	1287
blanchet@34969	1288	\prew
blanchet@34969	1289	\textbf{apply}~(\textit{induct~set}{:}~\textit{reach\/}) \\
blanchet@34969	1290	\textbf{apply}~\textit{auto}
blanchet@34969	1291	\postw
blanchet@34969	1292
blanchet@34969	1293	This leaves us in the following proof state:
blanchet@34969	1294
blanchet@34969	1295	\prew
blanchet@34969	1296	{\slshape goal (2 subgoals): \\
blanchet@34969	1297	\phantom{0}1. ${\bigwedge}n.\;\, \lbrakk n \in \textit{reach\/};\, n < 4;\, 2~\textsl{dvd}~n\rbrakk \,\Longrightarrow\, 2~\textsl{dvd}~\textit{Suc}~(3 * n)$ \\
blanchet@34969	1298	\phantom{0}2. ${\bigwedge}n.\;\, \lbrakk n \in \textit{reach\/};\, 2~\textsl{dvd}~n\rbrakk \,\Longrightarrow\, 2~\textsl{dvd}~\textit{Suc}~(\textit{Suc}~n)$
blanchet@34969	1299	}
blanchet@34969	1300	\postw
blanchet@34969	1301
blanchet@34969	1302	If we run Nitpick on the first subgoal, it still won't find any
blanchet@34969	1303	counterexample; and yet, \textit{auto} fails to go further, and \textit{arith}
blanchet@34969	1304	is helpless. However, notice the $n \in \textit{reach}$ assumption, which
blanchet@34969	1305	strengthens the induction hypothesis but is not immediately usable in the proof.
blanchet@34969	1306	If we remove it and invoke Nitpick, this time we get a counterexample:
blanchet@34969	1307
blanchet@34969	1308	\prew
blanchet@34969	1309	\textbf{apply}~(\textit{thin\_tac}~``$n \in \textit{reach\/}$'') \\
blanchet@34969	1310	\textbf{nitpick} \\[2\smallskipamount]
blanchet@34969	1311	\slshape Nitpick found a counterexample: \\[2\smallskipamount]
blanchet@34969	1312	\hbox{}\qquad Skolem constant: \nopagebreak \\
blanchet@34969	1313	\hbox{}\qquad\qquad $n = 0$
blanchet@34969	1314	\postw
blanchet@34969	1315
blanchet@34969	1316	Indeed, $0 < 4$, 2 divides 0, but 2 does not divide 1. We can use this information
blanchet@34969	1317	to strengthen the lemma:
blanchet@34969	1318
blanchet@34969	1319	\prew
blanchet@34969	1320	\textbf{lemma}~``$n \in \textit{reach} \,\Longrightarrow\, 2~\textrm{dvd}~n \mathrel{\land} n \not= 0$''
blanchet@34969	1321	\postw
blanchet@34969	1322
blanchet@34969	1323	Unfortunately, the proof by induction still gets stuck, except that Nitpick now
blanchet@34969	1324	finds the counterexample $n = 2$. We generalize the lemma further to
blanchet@34969	1325
blanchet@34969	1326	\prew
blanchet@34969	1327	\textbf{lemma}~``$n \in \textit{reach} \,\Longrightarrow\, 2~\textrm{dvd}~n \mathrel{\land} n \ge 4$''
blanchet@34969	1328	\postw
blanchet@34969	1329
blanchet@34969	1330	and this time \textit{arith} can finish off the subgoals.
blanchet@34969	1331
blanchet@34969	1332	A similar technique can be employed for structural induction. The
blanchet@34969	1333	following mini-formalization of full binary trees will serve as illustration:
blanchet@34969	1334
blanchet@34969	1335	\prew
blanchet@34969	1336	\textbf{datatype} $\kern1pt'a$~\textit{bin\_tree} = $\textit{Leaf}~{\kern1pt'a}$ $\mid$ $\textit{Branch}$ ``\kern1pt$'a$ \textit{bin\_tree}'' ``\kern1pt$'a$ \textit{bin\_tree}'' \\[2\smallskipamount]
blanchet@34969	1337	\textbf{primrec}~\textit{labels}~\textbf{where} \\
blanchet@34969	1338	``$\textit{labels}~(\textit{Leaf}~a) = \{a\}$'' $\mid$ \\
blanchet@34969	1339	``$\textit{labels}~(\textit{Branch}~t~u) = \textit{labels}~t \mathrel{\cup} \textit{labels}~u$'' \\[2\smallskipamount]
blanchet@34969	1340	\textbf{primrec}~\textit{swap}~\textbf{where} \\
blanchet@34969	1341	``$\textit{swap}~(\textit{Leaf}~c)~a~b =$ \\
blanchet@34969	1342	\phantom{``}$(\textrm{if}~c = a~\textrm{then}~\textit{Leaf}~b~\textrm{else~if}~c = b~\textrm{then}~\textit{Leaf}~a~\textrm{else}~\textit{Leaf}~c)$'' $\mid$ \\
blanchet@34969	1343	``$\textit{swap}~(\textit{Branch}~t~u)~a~b = \textit{Branch}~(\textit{swap}~t~a~b)~(\textit{swap}~u~a~b)$''
blanchet@34969	1344	\postw
blanchet@34969	1345
blanchet@34969	1346	The \textit{labels} function returns the set of labels occurring on leaves of a
blanchet@34969	1347	tree, and \textit{swap} exchanges two labels. Intuitively, if two distinct
blanchet@34969	1348	labels $a$ and $b$ occur in a tree $t$, they should also occur in the tree
blanchet@34969	1349	obtained by swapping $a$ and $b$:
blanchet@34969	1350
blanchet@34969	1351	\prew
blanchet@34969	1352	\textbf{lemma} ``$\lbrakk a \in \textit{labels}~t;\, b \in \textit{labels}~t;\, a \not= b\rbrakk {}$ \\
blanchet@34969	1353	\phantom{\textbf{lemma} ``}$\,{\Longrightarrow}{\;\,} \textit{labels}~(\textit{swap}~t~a~b) = \textit{labels}~t$''
blanchet@34969	1354	\postw
blanchet@34969	1355
blanchet@34969	1356	Nitpick can't find any counterexample, so we proceed with induction
blanchet@34969	1357	(this time favoring a more structured style):
blanchet@34969	1358
blanchet@34969	1359	\prew
blanchet@34969	1360	\textbf{proof}~(\textit{induct}~$t$) \\
blanchet@34969	1361	\hbox{}\quad \textbf{case}~\textit{Leaf}~\textbf{thus}~\textit{?case}~\textbf{by}~\textit{simp} \\
blanchet@34969	1362	\textbf{next} \\
blanchet@34969	1363	\hbox{}\quad \textbf{case}~$(\textit{Branch}~t~u)$~\textbf{thus} \textit{?case}
blanchet@34969	1364	\postw
blanchet@34969	1365
blanchet@34969	1366	Nitpick can't find any counterexample at this point either, but it makes the
blanchet@34969	1367	following suggestion:
blanchet@34969	1368
blanchet@34969	1369	\prew
blanchet@34969	1370	\slshape
blanchet@34969	1371	Hint: To check that the induction hypothesis is general enough, try the following command:
blanchet@34969	1372	\textbf{nitpick}~[\textit{non\_std} ``${\kern1pt'a}~\textit{bin\_tree}$'', \textit{show\_consts}].
blanchet@34969	1373	\postw
blanchet@34969	1374
blanchet@34969	1375	If we follow the hint, we get a ``nonstandard'' counterexample for the step:
blanchet@34969	1376
blanchet@34969	1377	\prew
blanchet@34969	1378	\slshape Nitpick found a nonstandard counterexample for \textit{card} $'a$ = 4: \\[2\smallskipamount]
blanchet@34969	1379	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@34969	1380	\hbox{}\qquad\qquad $a = a_4$ \\
blanchet@34969	1381	\hbox{}\qquad\qquad $b = a_3$ \\
blanchet@34969	1382	\hbox{}\qquad\qquad $t = \xi_3$ \\
blanchet@34969	1383	\hbox{}\qquad\qquad $u = \xi_4$ \\
blanchet@34969	1384	\hbox{}\qquad {\slshape Constants:} \nopagebreak \\
blanchet@34969	1385	\hbox{}\qquad\qquad $\textit{labels} = \undef
blanchet@34969	1386	(\!\begin{aligned}[t]%
blanchet@34969	1387	& \xi_3 := \{a_4\},\> \xi_4 := \{a_1, a_3\}, \\[-2pt] %% TYPESETTING
blanchet@34969	1388	& \textit{Branch}~\xi_3~\xi_3 := \{a_4\}, \\[-2pt]
blanchet@34969	1389	& \textit{Branch}~\xi_3~\xi_4 := \{a_1, a_3, a_4\})\end{aligned}$ \\
blanchet@34969	1390	\hbox{}\qquad\qquad $\lambda x_1.\> \textit{swap}~x_1~a~b = \undef
blanchet@34969	1391	(\!\begin{aligned}[t]%
blanchet@34969	1392	& \xi_3 := \xi_3,\> \xi_4 := \xi_3, \\[-2pt]
blanchet@34969	1393	& \textit{Branch}~\xi_3~\xi_3 := \textit{Branch}~\xi_3~\xi_3, \\[-2pt]
blanchet@34969	1394	& \textit{Branch}~\xi_3~\xi_4 := \textit{Branch}~\xi_3~\xi_3)\end{aligned}$ \\[2\smallskipamount]
blanchet@34969	1395	The existence of a nonstandard model suggests that the induction hypothesis is not general enough or perhaps
blanchet@34969	1396	even wrong. See the ``Inductive Properties'' section of the Nitpick manual for details (``\textit{isabelle doc nitpick}'').
blanchet@34969	1397	\postw
blanchet@34969	1398
blanchet@34969	1399	Reading the Nitpick manual is a most excellent idea.
blanchet@34969	1400	But what's going on? The \textit{non\_std} ``${\kern1pt'a}~\textit{bin\_tree}$''
blanchet@34969	1401	option told the tool to look for nonstandard models of binary trees, which
blanchet@34969	1402	means that new ``nonstandard'' trees $\xi_1, \xi_2, \ldots$, are now allowed in
blanchet@34969	1403	addition to the standard trees generated by the \textit{Leaf} and
blanchet@34969	1404	\textit{Branch} constructors.%
blanchet@34969	1405	\footnote{Notice the similarity between allowing nonstandard trees here and
blanchet@34969	1406	allowing unreachable states in the preceding example (by removing the ``$n \in
blanchet@34969	1407	\textit{reach\/}$'' assumption). In both cases, we effectively enlarge the
blanchet@34969	1408	set of objects over which the induction is performed while doing the step
blanchet@34969	1409	so as to test the induction hypothesis's strength.}
blanchet@34969	1410	The new trees are so nonstandard that we know nothing about them, except what
blanchet@34969	1411	the induction hypothesis states and what can be proved about all trees without
blanchet@34969	1412	relying on induction or case distinction. The key observation is,
blanchet@34969	1413	%
blanchet@34969	1414	\begin{quote}
blanchet@34969	1415	\textsl{If the induction
blanchet@34969	1416	hypothesis is strong enough, the induction step will hold even for nonstandard
blanchet@34969	1417	objects, and Nitpick won't find any nonstandard counterexample.}
blanchet@34969	1418	\end{quote}
blanchet@34969	1419	%
blanchet@34969	1420	But here, Nitpick did find some nonstandard trees $t = \xi_3$
blanchet@34969	1421	and $u = \xi_4$ such that $a \in \textit{labels}~t$, $b \notin
blanchet@34969	1422	\textit{labels}~t$, $a \notin \textit{labels}~u$, and $b \in \textit{labels}~u$.
blanchet@34969	1423	Because neither tree contains both $a$ and $b$, the induction hypothesis tells
blanchet@34969	1424	us nothing about the labels of $\textit{swap}~t~a~b$ and $\textit{swap}~u~a~b$,
blanchet@34969	1425	and as a result we know nothing about the labels of the tree
blanchet@34969	1426	$\textit{swap}~(\textit{Branch}~t~u)~a~b$, which by definition equals
blanchet@34969	1427	$\textit{Branch}$ $(\textit{swap}~t~a~b)$ $(\textit{swap}~u~a~b)$, whose
blanchet@34969	1428	labels are $\textit{labels}$ $(\textit{swap}~t~a~b) \mathrel{\cup}
blanchet@34969	1429	\textit{labels}$ $(\textit{swap}~u~a~b)$.
blanchet@34969	1430
blanchet@34969	1431	The solution is to ensure that we always know what the labels of the subtrees
blanchet@34969	1432	are in the inductive step, by covering the cases where $a$ and/or~$b$ is not in
blanchet@34969	1433	$t$ in the statement of the lemma:
blanchet@34969	1434
blanchet@34969	1435	\prew
blanchet@34969	1436	\textbf{lemma} ``$\textit{labels}~(\textit{swap}~t~a~b) = {}$ \\
blanchet@34969	1437	\phantom{\textbf{lemma} ``}$(\textrm{if}~a \in \textit{labels}~t~\textrm{then}$ \nopagebreak \\
blanchet@34969	1438	\phantom{\textbf{lemma} ``(\quad}$\textrm{if}~b \in \textit{labels}~t~\textrm{then}~\textit{labels}~t~\textrm{else}~(\textit{labels}~t - \{a\}) \mathrel{\cup} \{b\}$ \\
blanchet@34969	1439	\phantom{\textbf{lemma} ``(}$\textrm{else}$ \\
blanchet@34969	1440	\phantom{\textbf{lemma} ``(\quad}$\textrm{if}~b \in \textit{labels}~t~\textrm{then}~(\textit{labels}~t - \{b\}) \mathrel{\cup} \{a\}~\textrm{else}~\textit{labels}~t)$''
blanchet@34969	1441	\postw
blanchet@34969	1442
blanchet@34969	1443	This time, Nitpick won't find any nonstandard counterexample, and we can perform
blanchet@34969	1444	the induction step using \textit{auto}.
blanchet@34969	1445
blanchet@33191	1446	\section{Case Studies}
blanchet@33191	1447	\label{case-studies}
blanchet@33191	1448
blanchet@33191	1449	As a didactic device, the previous section focused mostly on toy formulas whose
blanchet@33191	1450	validity can easily be assessed just by looking at the formula. We will now
blanchet@33191	1451	review two somewhat more realistic case studies that are within Nitpick's
blanchet@33191	1452	reach:\ a context-free grammar modeled by mutually inductive sets and a
blanchet@33191	1453	functional implementation of AA trees. The results presented in this
blanchet@33191	1454	section were produced with the following settings:
blanchet@33191	1455
blanchet@33191	1456	\prew
blanchet@33191	1457	\textbf{nitpick\_params} [\textit{max\_potential}~= 0,\, \textit{max\_threads} = 2]
blanchet@33191	1458	\postw
blanchet@33191	1459
blanchet@33191	1460	\subsection{A Context-Free Grammar}
blanchet@33191	1461	\label{a-context-free-grammar}
blanchet@33191	1462
blanchet@33191	1463	Our first case study is taken from section 7.4 in the Isabelle tutorial
blanchet@33191	1464	\cite{isa-tutorial}. The following grammar, originally due to Hopcroft and
blanchet@33191	1465	Ullman, produces all strings with an equal number of $a$'s and $b$'s:
blanchet@33191	1466
blanchet@33191	1467	\prew
blanchet@33191	1468	\begin{tabular}{@{}r@{$\;\,$}c@{$\;\,$}l@{}}
blanchet@33191	1469	$S$ & $::=$ & $\epsilon \mid bA \mid aB$ \\
blanchet@33191	1470	$A$ & $::=$ & $aS \mid bAA$ \\
blanchet@33191	1471	$B$ & $::=$ & $bS \mid aBB$
blanchet@33191	1472	\end{tabular}
blanchet@33191	1473	\postw
blanchet@33191	1474
blanchet@33191	1475	The intuition behind the grammar is that $A$ generates all strings with one more
blanchet@33191	1476	$a$ than $b$'s and $B$ generates all strings with one more $b$ than $a$'s.
blanchet@33191	1477
blanchet@33191	1478	The alphabet consists exclusively of $a$'s and $b$'s:
blanchet@33191	1479
blanchet@33191	1480	\prew
blanchet@33191	1481	\textbf{datatype} \textit{alphabet}~= $a$ $\mid$ $b$
blanchet@33191	1482	\postw
blanchet@33191	1483
blanchet@33191	1484	Strings over the alphabet are represented by \textit{alphabet list}s.
blanchet@33191	1485	Nonterminals in the grammar become sets of strings. The production rules
blanchet@33191	1486	presented above can be expressed as a mutually inductive definition:
blanchet@33191	1487
blanchet@33191	1488	\prew
blanchet@33191	1489	\textbf{inductive\_set} $S$ \textbf{and} $A$ \textbf{and} $B$ \textbf{where} \\
blanchet@33191	1490	\textit{R1}:\kern.4em ``$[] \in S$'' $\,\mid$ \\
blanchet@33191	1491	\textit{R2}:\kern.4em ``$w \in A\,\Longrightarrow\, b \mathbin{\#} w \in S$'' $\,\mid$ \\
blanchet@33191	1492	\textit{R3}:\kern.4em ``$w \in B\,\Longrightarrow\, a \mathbin{\#} w \in S$'' $\,\mid$ \\
blanchet@33191	1493	\textit{R4}:\kern.4em ``$w \in S\,\Longrightarrow\, a \mathbin{\#} w \in A$'' $\,\mid$ \\
blanchet@33191	1494	\textit{R5}:\kern.4em ``$w \in S\,\Longrightarrow\, b \mathbin{\#} w \in S$'' $\,\mid$ \\
blanchet@33191	1495	\textit{R6}:\kern.4em ``$\lbrakk v \in B;\> v \in B\rbrakk \,\Longrightarrow\, a \mathbin{\#} v \mathbin{@} w \in B$''
blanchet@33191	1496	\postw
blanchet@33191	1497
blanchet@33191	1498	The conversion of the grammar into the inductive definition was done manually by
blanchet@33191	1499	Joe Blow, an underpaid undergraduate student. As a result, some errors might
blanchet@33191	1500	have sneaked in.
blanchet@33191	1501
blanchet@33191	1502	Debugging faulty specifications is at the heart of Nitpick's \textsl{raison
blanchet@33191	1503	d'\^etre}. A good approach is to state desirable properties of the specification
blanchet@33191	1504	(here, that $S$ is exactly the set of strings over $\{a, b\}$ with as many $a$'s
blanchet@33191	1505	as $b$'s) and check them with Nitpick. If the properties are correctly stated,
blanchet@33191	1506	counterexamples will point to bugs in the specification. For our grammar
blanchet@33191	1507	example, we will proceed in two steps, separating the soundness and the
blanchet@33191	1508	completeness of the set $S$. First, soundness:
blanchet@33191	1509
blanchet@33191	1510	\prew
blanchet@33191	1511	\textbf{theorem}~\textit{S\_sound}: \\
blanchet@33191	1512	``$w \in S \longrightarrow \textit{length}~[x\mathbin{\leftarrow} w.\; x = a] =
blanchet@33191	1513	\textit{length}~[x\mathbin{\leftarrow} w.\; x = b]$'' \\
blanchet@33191	1514	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	1515	\slshape Nitpick found a counterexample: \\[2\smallskipamount]
blanchet@33191	1516	\hbox{}\qquad Free variable: \nopagebreak \\
blanchet@33191	1517	\hbox{}\qquad\qquad $w = [b]$
blanchet@33191	1518	\postw
blanchet@33191	1519
blanchet@33191	1520	It would seem that $[b] \in S$. How could this be? An inspection of the
blanchet@33191	1521	introduction rules reveals that the only rule with a right-hand side of the form
blanchet@33191	1522	$b \mathbin{\#} {\ldots} \in S$ that could have introduced $[b]$ into $S$ is
blanchet@33191	1523	\textit{R5}:
blanchet@33191	1524
blanchet@33191	1525	\prew
blanchet@33191	1526	``$w \in S\,\Longrightarrow\, b \mathbin{\#} w \in S$''
blanchet@33191	1527	\postw
blanchet@33191	1528
blanchet@33191	1529	On closer inspection, we can see that this rule is wrong. To match the
blanchet@33191	1530	production $B ::= bS$, the second $S$ should be a $B$. We fix the typo and try
blanchet@33191	1531	again:
blanchet@33191	1532
blanchet@33191	1533	\prew
blanchet@33191	1534	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	1535	\slshape Nitpick found a counterexample: \\[2\smallskipamount]
blanchet@33191	1536	\hbox{}\qquad Free variable: \nopagebreak \\
blanchet@33191	1537	\hbox{}\qquad\qquad $w = [a, a, b]$
blanchet@33191	1538	\postw
blanchet@33191	1539
blanchet@33191	1540	Some detective work is necessary to find out what went wrong here. To get $[a,
blanchet@33191	1541	a, b] \in S$, we need $[a, b] \in B$ by \textit{R3}, which in turn can only come
blanchet@33191	1542	from \textit{R6}:
blanchet@33191	1543
blanchet@33191	1544	\prew
blanchet@33191	1545	``$\lbrakk v \in B;\> v \in B\rbrakk \,\Longrightarrow\, a \mathbin{\#} v \mathbin{@} w \in B$''
blanchet@33191	1546	\postw
blanchet@33191	1547
blanchet@33191	1548	Now, this formula must be wrong: The same assumption occurs twice, and the
blanchet@33191	1549	variable $w$ is unconstrained. Clearly, one of the two occurrences of $v$ in
blanchet@33191	1550	the assumptions should have been a $w$.
blanchet@33191	1551
blanchet@33191	1552	With the correction made, we don't get any counterexample from Nitpick. Let's
blanchet@33191	1553	move on and check completeness:
blanchet@33191	1554
blanchet@33191	1555	\prew
blanchet@33191	1556	\textbf{theorem}~\textit{S\_complete}: \\
blanchet@33191	1557	``$\textit{length}~[x\mathbin{\leftarrow} w.\; x = a] =
blanchet@33191	1558	\textit{length}~[x\mathbin{\leftarrow} w.\; x = b]
blanchet@33191	1559	\longrightarrow w \in S$'' \\
blanchet@33191	1560	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	1561	\slshape Nitpick found a counterexample: \\[2\smallskipamount]
blanchet@33191	1562	\hbox{}\qquad Free variable: \nopagebreak \\
blanchet@33191	1563	\hbox{}\qquad\qquad $w = [b, b, a, a]$
blanchet@33191	1564	\postw
blanchet@33191	1565
blanchet@33191	1566	Apparently, $[b, b, a, a] \notin S$, even though it has the same number of
blanchet@33191	1567	$a$'s and $b$'s. But since our inductive definition passed the soundness check,
blanchet@33191	1568	the introduction rules we have are probably correct. Perhaps we simply lack an
blanchet@33191	1569	introduction rule. Comparing the grammar with the inductive definition, our
blanchet@33191	1570	suspicion is confirmed: Joe Blow simply forgot the production $A ::= bAA$,
blanchet@33191	1571	without which the grammar cannot generate two or more $b$'s in a row. So we add
blanchet@33191	1572	the rule
blanchet@33191	1573
blanchet@33191	1574	\prew
blanchet@33191	1575	``$\lbrakk v \in A;\> w \in A\rbrakk \,\Longrightarrow\, b \mathbin{\#} v \mathbin{@} w \in A$''
blanchet@33191	1576	\postw
blanchet@33191	1577
blanchet@33191	1578	With this last change, we don't get any counterexamples from Nitpick for either
blanchet@33191	1579	soundness or completeness. We can even generalize our result to cover $A$ and
blanchet@33191	1580	$B$ as well:
blanchet@33191	1581
blanchet@33191	1582	\prew
blanchet@33191	1583	\textbf{theorem} \textit{S\_A\_B\_sound\_and\_complete}: \\
blanchet@33191	1584	``$w \in S \longleftrightarrow \textit{length}~[x \mathbin{\leftarrow} w.\; x = a] = \textit{length}~[x \mathbin{\leftarrow} w.\; x = b]$'' \\
blanchet@33191	1585	``$w \in A \longleftrightarrow \textit{length}~[x \mathbin{\leftarrow} w.\; x = a] = \textit{length}~[x \mathbin{\leftarrow} w.\; x = b] + 1$'' \\
blanchet@33191	1586	``$w \in B \longleftrightarrow \textit{length}~[x \mathbin{\leftarrow} w.\; x = b] = \textit{length}~[x \mathbin{\leftarrow} w.\; x = a] + 1$'' \\
blanchet@33191	1587	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	1588	\slshape Nitpick found no counterexample.
blanchet@33191	1589	\postw
blanchet@33191	1590
blanchet@33191	1591	\subsection{AA Trees}
blanchet@33191	1592	\label{aa-trees}
blanchet@33191	1593
blanchet@33191	1594	AA trees are a kind of balanced trees discovered by Arne Andersson that provide
blanchet@33191	1595	similar performance to red-black trees, but with a simpler implementation
blanchet@33191	1596	\cite{andersson-1993}. They can be used to store sets of elements equipped with
blanchet@33191	1597	a total order $<$. We start by defining the datatype and some basic extractor
blanchet@33191	1598	functions:
blanchet@33191	1599
blanchet@33191	1600	\prew
blanchet@34969	1601	\textbf{datatype} $'a$~\textit{aa\_tree} = \\
blanchet@34969	1602	\hbox{}\quad $\Lambda$ $\mid$ $N$ ``\kern1pt$'a\Colon \textit{linorder}$'' \textit{nat} ``\kern1pt$'a$ \textit{aa\_tree}'' ``\kern1pt$'a$ \textit{aa\_tree}'' \\[2\smallskipamount]
blanchet@33191	1603	\textbf{primrec} \textit{data} \textbf{where} \\
blanchet@33191	1604	``$\textit{data}~\Lambda = \undef$'' $\,\mid$ \\
blanchet@33191	1605	``$\textit{data}~(N~x~\_~\_~\_) = x$'' \\[2\smallskipamount]
blanchet@33191	1606	\textbf{primrec} \textit{dataset} \textbf{where} \\
blanchet@33191	1607	``$\textit{dataset}~\Lambda = \{\}$'' $\,\mid$ \\
blanchet@33191	1608	``$\textit{dataset}~(N~x~\_~t~u) = \{x\} \cup \textit{dataset}~t \mathrel{\cup} \textit{dataset}~u$'' \\[2\smallskipamount]
blanchet@33191	1609	\textbf{primrec} \textit{level} \textbf{where} \\
blanchet@33191	1610	``$\textit{level}~\Lambda = 0$'' $\,\mid$ \\
blanchet@33191	1611	``$\textit{level}~(N~\_~k~\_~\_) = k$'' \\[2\smallskipamount]
blanchet@33191	1612	\textbf{primrec} \textit{left} \textbf{where} \\
blanchet@33191	1613	``$\textit{left}~\Lambda = \Lambda$'' $\,\mid$ \\
blanchet@33191	1614	``$\textit{left}~(N~\_~\_~t~\_) = t$'' \\[2\smallskipamount]
blanchet@33191	1615	\textbf{primrec} \textit{right} \textbf{where} \\
blanchet@33191	1616	``$\textit{right}~\Lambda = \Lambda$'' $\,\mid$ \\
blanchet@33191	1617	``$\textit{right}~(N~\_~\_~\_~u) = u$''
blanchet@33191	1618	\postw
blanchet@33191	1619
blanchet@33191	1620	The wellformedness criterion for AA trees is fairly complex. Wikipedia states it
blanchet@33191	1621	as follows \cite{wikipedia-2009-aa-trees}:
blanchet@33191	1622
blanchet@33191	1623	\kern.2\parskip %% TYPESETTING
blanchet@33191	1624
blanchet@33191	1625	\pre
blanchet@33191	1626	Each node has a level field, and the following invariants must remain true for
blanchet@33191	1627	the tree to be valid:
blanchet@33191	1628
blanchet@33191	1629	\raggedright
blanchet@33191	1630
blanchet@33191	1631	\kern-.4\parskip %% TYPESETTING
blanchet@33191	1632
blanchet@33191	1633	\begin{enum}
blanchet@33191	1634	\item[]
blanchet@33191	1635	\begin{enum}
blanchet@33191	1636	\item[1.] The level of a leaf node is one.
blanchet@33191	1637	\item[2.] The level of a left child is strictly less than that of its parent.
blanchet@33191	1638	\item[3.] The level of a right child is less than or equal to that of its parent.
blanchet@33191	1639	\item[4.] The level of a right grandchild is strictly less than that of its grandparent.
blanchet@33191	1640	\item[5.] Every node of level greater than one must have two children.
blanchet@33191	1641	\end{enum}
blanchet@33191	1642	\end{enum}
blanchet@33191	1643	\post
blanchet@33191	1644
blanchet@33191	1645	\kern.4\parskip %% TYPESETTING
blanchet@33191	1646
blanchet@33191	1647	The \textit{wf} predicate formalizes this description:
blanchet@33191	1648
blanchet@33191	1649	\prew
blanchet@33191	1650	\textbf{primrec} \textit{wf} \textbf{where} \\
blanchet@33191	1651	``$\textit{wf}~\Lambda = \textit{True}$'' $\,\mid$ \\
blanchet@33191	1652	``$\textit{wf}~(N~\_~k~t~u) =$ \\
blanchet@33191	1653	\phantom{``}$(\textrm{if}~t = \Lambda~\textrm{then}$ \\
blanchet@33191	1654	\phantom{``$(\quad$}$k = 1 \mathrel{\land} (u = \Lambda \mathrel{\lor} (\textit{level}~u = 1 \mathrel{\land} \textit{left}~u = \Lambda \mathrel{\land} \textit{right}~u = \Lambda))$ \\
blanchet@33191	1655	\phantom{``$($}$\textrm{else}$ \\
blanchet@33193	1656	\hbox{}\phantom{``$(\quad$}$\textit{wf}~t \mathrel{\land} \textit{wf}~u
blanchet@33191	1657	\mathrel{\land} u \not= \Lambda \mathrel{\land} \textit{level}~t < k
blanchet@33193	1658	\mathrel{\land} \textit{level}~u \le k$ \\
blanchet@33193	1659	\hbox{}\phantom{``$(\quad$}${\land}\; \textit{level}~(\textit{right}~u) < k)$''
blanchet@33191	1660	\postw
blanchet@33191	1661
blanchet@33191	1662	Rebalancing the tree upon insertion and removal of elements is performed by two
blanchet@33191	1663	auxiliary functions called \textit{skew} and \textit{split}, defined below:
blanchet@33191	1664
blanchet@33191	1665	\prew
blanchet@33191	1666	\textbf{primrec} \textit{skew} \textbf{where} \\
blanchet@33191	1667	``$\textit{skew}~\Lambda = \Lambda$'' $\,\mid$ \\
blanchet@33191	1668	``$\textit{skew}~(N~x~k~t~u) = {}$ \\
blanchet@33191	1669	\phantom{``}$(\textrm{if}~t \not= \Lambda \mathrel{\land} k =
blanchet@33191	1670	\textit{level}~t~\textrm{then}$ \\
blanchet@33191	1671	\phantom{``(\quad}$N~(\textit{data}~t)~k~(\textit{left}~t)~(N~x~k~
blanchet@33191	1672	(\textit{right}~t)~u)$ \\
blanchet@33191	1673	\phantom{``(}$\textrm{else}$ \\
blanchet@33191	1674	\phantom{``(\quad}$N~x~k~t~u)$''
blanchet@33191	1675	\postw
blanchet@33191	1676
blanchet@33191	1677	\prew
blanchet@33191	1678	\textbf{primrec} \textit{split} \textbf{where} \\
blanchet@33191	1679	``$\textit{split}~\Lambda = \Lambda$'' $\,\mid$ \\
blanchet@33191	1680	``$\textit{split}~(N~x~k~t~u) = {}$ \\
blanchet@33191	1681	\phantom{``}$(\textrm{if}~u \not= \Lambda \mathrel{\land} k =
blanchet@33191	1682	\textit{level}~(\textit{right}~u)~\textrm{then}$ \\
blanchet@33191	1683	\phantom{``(\quad}$N~(\textit{data}~u)~(\textit{Suc}~k)~
blanchet@33191	1684	(N~x~k~t~(\textit{left}~u))~(\textit{right}~u)$ \\
blanchet@33191	1685	\phantom{``(}$\textrm{else}$ \\
blanchet@33191	1686	\phantom{``(\quad}$N~x~k~t~u)$''
blanchet@33191	1687	\postw
blanchet@33191	1688
blanchet@33191	1689	Performing a \textit{skew} or a \textit{split} should have no impact on the set
blanchet@33191	1690	of elements stored in the tree:
blanchet@33191	1691
blanchet@33191	1692	\prew
blanchet@33191	1693	\textbf{theorem}~\textit{dataset\_skew\_split}:\\
blanchet@33191	1694	``$\textit{dataset}~(\textit{skew}~t) = \textit{dataset}~t$'' \\
blanchet@33191	1695	``$\textit{dataset}~(\textit{split}~t) = \textit{dataset}~t$'' \\
blanchet@33191	1696	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	1697	{\slshape Nitpick ran out of time after checking 7 of 8 scopes.}
blanchet@33191	1698	\postw
blanchet@33191	1699
blanchet@33191	1700	Furthermore, applying \textit{skew} or \textit{split} to a well-formed tree
blanchet@33191	1701	should not alter the tree:
blanchet@33191	1702
blanchet@33191	1703	\prew
blanchet@33191	1704	\textbf{theorem}~\textit{wf\_skew\_split}:\\
blanchet@33191	1705	``$\textit{wf}~t\,\Longrightarrow\, \textit{skew}~t = t$'' \\
blanchet@33191	1706	``$\textit{wf}~t\,\Longrightarrow\, \textit{split}~t = t$'' \\
blanchet@33191	1707	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	1708	{\slshape Nitpick found no counterexample.}
blanchet@33191	1709	\postw
blanchet@33191	1710
blanchet@33191	1711	Insertion is implemented recursively. It preserves the sort order:
blanchet@33191	1712
blanchet@33191	1713	\prew
blanchet@33191	1714	\textbf{primrec}~\textit{insort} \textbf{where} \\
blanchet@33191	1715	``$\textit{insort}~\Lambda~x = N~x~1~\Lambda~\Lambda$'' $\,\mid$ \\
blanchet@33191	1716	``$\textit{insort}~(N~y~k~t~u)~x =$ \\
blanchet@33191	1717	\phantom{``}$({*}~(\textit{split} \circ \textit{skew})~{*})~(N~y~k~(\textrm{if}~x < y~\textrm{then}~\textit{insort}~t~x~\textrm{else}~t)$ \\
blanchet@33191	1718	\phantom{``$({*}~(\textit{split} \circ \textit{skew})~{*})~(N~y~k~$}$(\textrm{if}~x > y~\textrm{then}~\textit{insort}~u~x~\textrm{else}~u))$''
blanchet@33191	1719	\postw
blanchet@33191	1720
blanchet@33191	1721	Notice that we deliberately commented out the application of \textit{skew} and
blanchet@33191	1722	\textit{split}. Let's see if this causes any problems:
blanchet@33191	1723
blanchet@33191	1724	\prew
blanchet@33191	1725	\textbf{theorem}~\textit{wf\_insort}:\kern.4em ``$\textit{wf}~t\,\Longrightarrow\, \textit{wf}~(\textit{insort}~t~x)$'' \\
blanchet@33191	1726	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	1727	\slshape Nitpick found a counterexample for \textit{card} $'a$ = 4: \\[2\smallskipamount]
blanchet@33191	1728	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	1729	\hbox{}\qquad\qquad $t = N~a_3~1~\Lambda~\Lambda$ \\
blanchet@34969	1730	\hbox{}\qquad\qquad $x = a_4$
blanchet@33191	1731	\postw
blanchet@33191	1732
blanchet@34038	1733	It's hard to see why this is a counterexample. To improve readability, we will
blanchet@34038	1734	restrict the theorem to \textit{nat}, so that we don't need to look up the value
blanchet@34038	1735	of the $\textit{op}~{<}$ constant to find out which element is smaller than the
blanchet@34038	1736	other. In addition, we will tell Nitpick to display the value of
blanchet@34038	1737	$\textit{insort}~t~x$ using the \textit{eval} option. This gives
blanchet@33191	1738
blanchet@33191	1739	\prew
blanchet@33191	1740	\textbf{theorem} \textit{wf\_insort\_nat}:\kern.4em ``$\textit{wf}~t\,\Longrightarrow\, \textit{wf}~(\textit{insort}~t~(x\Colon\textit{nat}))$'' \\
blanchet@33191	1741	\textbf{nitpick} [\textit{eval} = ``$\textit{insort}~t~x$''] \\[2\smallskipamount]
blanchet@33191	1742	\slshape Nitpick found a counterexample: \\[2\smallskipamount]
blanchet@33191	1743	\hbox{}\qquad Free variables: \nopagebreak \\
blanchet@33191	1744	\hbox{}\qquad\qquad $t = N~1~1~\Lambda~\Lambda$ \\
blanchet@33191	1745	\hbox{}\qquad\qquad $x = 0$ \\
blanchet@33191	1746	\hbox{}\qquad Evaluated term: \\
blanchet@33191	1747	\hbox{}\qquad\qquad $\textit{insort}~t~x = N~1~1~(N~0~1~\Lambda~\Lambda)~\Lambda$
blanchet@33191	1748	\postw
blanchet@33191	1749
blanchet@33191	1750	Nitpick's output reveals that the element $0$ was added as a left child of $1$,
blanchet@33191	1751	where both have a level of 1. This violates the second AA tree invariant, which
blanchet@33191	1752	states that a left child's level must be less than its parent's. This shouldn't
blanchet@33191	1753	come as a surprise, considering that we commented out the tree rebalancing code.
blanchet@33191	1754	Reintroducing the code seems to solve the problem:
blanchet@33191	1755
blanchet@33191	1756	\prew
blanchet@33191	1757	\textbf{theorem}~\textit{wf\_insort}:\kern.4em ``$\textit{wf}~t\,\Longrightarrow\, \textit{wf}~(\textit{insort}~t~x)$'' \\
blanchet@33191	1758	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	1759	{\slshape Nitpick ran out of time after checking 6 of 8 scopes.}
blanchet@33191	1760	\postw
blanchet@33191	1761
blanchet@33191	1762	Insertion should transform the set of elements represented by the tree in the
blanchet@33191	1763	obvious way:
blanchet@33191	1764
blanchet@33191	1765	\prew
blanchet@33191	1766	\textbf{theorem} \textit{dataset\_insort}:\kern.4em
blanchet@33191	1767	``$\textit{dataset}~(\textit{insort}~t~x) = \{x\} \cup \textit{dataset}~t$'' \\
blanchet@33191	1768	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	1769	{\slshape Nitpick ran out of time after checking 5 of 8 scopes.}
blanchet@33191	1770	\postw
blanchet@33191	1771
blanchet@33191	1772	We could continue like this and sketch a complete theory of AA trees without
blanchet@33191	1773	performing a single proof. Once the definitions and main theorems are in place
blanchet@33191	1774	and have been thoroughly tested using Nitpick, we could start working on the
blanchet@33191	1775	proofs. Developing theories this way usually saves time, because faulty theorems
blanchet@33191	1776	and definitions are discovered much earlier in the process.
blanchet@33191	1777
blanchet@33191	1778	\section{Option Reference}
blanchet@33191	1779	\label{option-reference}
blanchet@33191	1780
blanchet@33191	1781	\def\flushitem#1{\item[]\noindent\kern-\leftmargin \textbf{#1}}
blanchet@33191	1782	\def\qty#1{$\left<\textit{#1}\right>$}
blanchet@33191	1783	\def\qtybf#1{$\mathbf{\left<\textbf{\textit{#1}}\right>}$}
blanchet@33191	1784	\def\optrue#1#2{\flushitem{\textit{#1} $\bigl[$= \qtybf{bool}$\bigr]$\quad [\textit{true}]\hfill (neg.: \textit{#2})}\nopagebreak\\[\parskip]}
blanchet@33191	1785	\def\opfalse#1#2{\flushitem{\textit{#1} $\bigl[$= \qtybf{bool}$\bigr]$\quad [\textit{false}]\hfill (neg.: \textit{#2})}\nopagebreak\\[\parskip]}
blanchet@33191	1786	\def\opsmart#1#2{\flushitem{\textit{#1} $\bigl[$= \qtybf{bool\_or\_smart}$\bigr]$\quad [\textit{smart}]\hfill (neg.: \textit{#2})}\nopagebreak\\[\parskip]}
blanchet@34969	1787	\def\opnodefault#1#2{\flushitem{\textit{#1} = \qtybf{#2}} \nopagebreak\\[\parskip]}
blanchet@34969	1788	\def\opdefault#1#2#3{\flushitem{\textit{#1} = \qtybf{#2}\quad [\textit{#3}]} \nopagebreak\\[\parskip]}
blanchet@34969	1789	\def\oparg#1#2#3{\flushitem{\textit{#1} \qtybf{#2} = \qtybf{#3}} \nopagebreak\\[\parskip]}
blanchet@34969	1790	\def\opargbool#1#2#3{\flushitem{\textit{#1} \qtybf{#2} $\bigl[$= \qtybf{bool}$\bigr]$\hfill (neg.: \textit{#3})}\nopagebreak\\[\parskip]}
blanchet@34969	1791	\def\opargboolorsmart#1#2#3{\flushitem{\textit{#1} \qtybf{#2} $\bigl[$= \qtybf{bool\_or\_smart}$\bigr]$\hfill (neg.: \textit{#3})}\nopagebreak\\[\parskip]}
blanchet@33191	1792
blanchet@33191	1793	Nitpick's behavior can be influenced by various options, which can be specified
blanchet@33191	1794	in brackets after the \textbf{nitpick} command. Default values can be set
blanchet@33191	1795	using \textbf{nitpick\_\allowbreak params}. For example:
blanchet@33191	1796
blanchet@33191	1797	\prew
blanchet@33191	1798	\textbf{nitpick\_params} [\textit{verbose}, \,\textit{timeout} = 60$\,s$]
blanchet@33191	1799	\postw
blanchet@33191	1800
blanchet@33191	1801	The options are categorized as follows:\ mode of operation
blanchet@33191	1802	(\S\ref{mode-of-operation}), scope of search (\S\ref{scope-of-search}), output
blanchet@33191	1803	format (\S\ref{output-format}), automatic counterexample checks
blanchet@33191	1804	(\S\ref{authentication}), optimizations
blanchet@33191	1805	(\S\ref{optimizations}), and timeouts (\S\ref{timeouts}).
blanchet@33191	1806
blanchet@33552	1807	You can instruct Nitpick to run automatically on newly entered theorems by
blanchet@33552	1808	enabling the ``Auto Nitpick'' option from the ``Isabelle'' menu in Proof
blanchet@33552	1809	General. For automatic runs, \textit{user\_axioms} (\S\ref{mode-of-operation})
blanchet@33552	1810	and \textit{assms} (\S\ref{mode-of-operation}) are implicitly enabled,
blanchet@33552	1811	\textit{blocking} (\S\ref{mode-of-operation}), \textit{verbose}
blanchet@33552	1812	(\S\ref{output-format}), and \textit{debug} (\S\ref{output-format}) are
blanchet@33552	1813	disabled, \textit{max\_potential} (\S\ref{output-format}) is taken to be 0, and
blanchet@33552	1814	\textit{timeout} (\S\ref{timeouts}) is superseded by the ``Auto Counterexample
blanchet@33552	1815	Time Limit'' in Proof General's ``Isabelle'' menu. Nitpick's output is also more
blanchet@33552	1816	concise.
blanchet@33552	1817
blanchet@33191	1818	The number of options can be overwhelming at first glance. Do not let that worry
blanchet@33191	1819	you: Nitpick's defaults have been chosen so that it almost always does the right
blanchet@33191	1820	thing, and the most important options have been covered in context in
blanchet@33191	1821	\S\ref{first-steps}.
blanchet@33191	1822
blanchet@33191	1823	The descriptions below refer to the following syntactic quantities:
blanchet@33191	1824
blanchet@33191	1825	\begin{enum}
blanchet@33191	1826	\item[$\bullet$] \qtybf{string}: A string.
blanchet@33191	1827	\item[$\bullet$] \qtybf{bool}: \textit{true} or \textit{false}.
blanchet@33191	1828	\item[$\bullet$] \qtybf{bool\_or\_smart}: \textit{true}, \textit{false}, or \textit{smart}.
blanchet@33191	1829	\item[$\bullet$] \qtybf{int}: An integer. Negative integers are prefixed with a hyphen.
blanchet@33191	1830	\item[$\bullet$] \qtybf{int\_or\_smart}: An integer or \textit{smart}.
blanchet@33191	1831	\item[$\bullet$] \qtybf{int\_range}: An integer (e.g., 3) or a range
blanchet@33191	1832	of nonnegative integers (e.g., $1$--$4$). The range symbol `--' can be entered as \texttt{-} (hyphen) or \texttt{\char`\\\char`\<midarrow\char`\>}.
blanchet@33191	1833
blanchet@33191	1834	\item[$\bullet$] \qtybf{int\_seq}: A comma-separated sequence of ranges of integers (e.g.,~1{,}3{,}\allowbreak6--8).
blanchet@33191	1835	\item[$\bullet$] \qtybf{time}: An integer followed by $\textit{min}$ (minutes), $s$ (seconds), or \textit{ms}
blanchet@33191	1836	(milliseconds), or the keyword \textit{none} ($\infty$ years).
blanchet@33191	1837	\item[$\bullet$] \qtybf{const}: The name of a HOL constant.
blanchet@33191	1838	\item[$\bullet$] \qtybf{term}: A HOL term (e.g., ``$f~x$'').
blanchet@33191	1839	\item[$\bullet$] \qtybf{term\_list}: A space-separated list of HOL terms (e.g.,
blanchet@33191	1840	``$f~x$''~``$g~y$'').
blanchet@33191	1841	\item[$\bullet$] \qtybf{type}: A HOL type.
blanchet@33191	1842	\end{enum}
blanchet@33191	1843
blanchet@33191	1844	Default values are indicated in square brackets. Boolean options have a negated
blanchet@33552	1845	counterpart (e.g., \textit{blocking} vs.\ \textit{non\_blocking}). When setting
blanchet@33552	1846	Boolean options, ``= \textit{true}'' may be omitted.
blanchet@33191	1847
blanchet@33191	1848	\subsection{Mode of Operation}
blanchet@33191	1849	\label{mode-of-operation}
blanchet@33191	1850
blanchet@33191	1851	\begin{enum}
blanchet@33191	1852	\optrue{blocking}{non\_blocking}
blanchet@33191	1853	Specifies whether the \textbf{nitpick} command should operate synchronously.
blanchet@33191	1854	The asynchronous (non-blocking) mode lets the user start proving the putative
blanchet@33191	1855	theorem while Nitpick looks for a counterexample, but it can also be more
blanchet@33191	1856	confusing. For technical reasons, automatic runs currently always block.
blanchet@33191	1857
blanchet@33191	1858	\optrue{falsify}{satisfy}
blanchet@33191	1859	Specifies whether Nitpick should look for falsifying examples (countermodels) or
blanchet@33191	1860	satisfying examples (models). This manual assumes throughout that
blanchet@33191	1861	\textit{falsify} is enabled.
blanchet@33191	1862
blanchet@33191	1863	\opsmart{user\_axioms}{no\_user\_axioms}
blanchet@33191	1864	Specifies whether the user-defined axioms (specified using
blanchet@33191	1865	\textbf{axiomatization} and \textbf{axioms}) should be considered. If the option
blanchet@33191	1866	is set to \textit{smart}, Nitpick performs an ad hoc axiom selection based on
blanchet@33191	1867	the constants that occur in the formula to falsify. The option is implicitly set
blanchet@33191	1868	to \textit{true} for automatic runs.
blanchet@33191	1869
blanchet@33191	1870	\textbf{Warning:} If the option is set to \textit{true}, Nitpick might
blanchet@33191	1871	nonetheless ignore some polymorphic axioms. Counterexamples generated under
blanchet@33191	1872	these conditions are tagged as ``likely genuine.'' The \textit{debug}
blanchet@33191	1873	(\S\ref{output-format}) option can be used to find out which axioms were
blanchet@33191	1874	considered.
blanchet@33191	1875
blanchet@33191	1876	\nopagebreak
blanchet@33552	1877	{\small See also \textit{assms} (\S\ref{mode-of-operation}) and \textit{debug}
blanchet@33552	1878	(\S\ref{output-format}).}
blanchet@33191	1879
blanchet@33191	1880	\optrue{assms}{no\_assms}
blanchet@33191	1881	Specifies whether the relevant assumptions in structured proofs should be
blanchet@33191	1882	considered. The option is implicitly enabled for automatic runs.
blanchet@33191	1883
blanchet@33191	1884	\nopagebreak
blanchet@33552	1885	{\small See also \textit{user\_axioms} (\S\ref{mode-of-operation}).}
blanchet@33191	1886
blanchet@33191	1887	\opfalse{overlord}{no\_overlord}
blanchet@33191	1888	Specifies whether Nitpick should put its temporary files in
blanchet@33191	1889	\texttt{\$ISABELLE\_\allowbreak HOME\_\allowbreak USER}, which is useful for
blanchet@33191	1890	debugging Nitpick but also unsafe if several instances of the tool are run
blanchet@33196	1891	simultaneously.
blanchet@33191	1892
blanchet@33191	1893	\nopagebreak
blanchet@33191	1894	{\small See also \textit{debug} (\S\ref{output-format}).}
blanchet@33191	1895	\end{enum}
blanchet@33191	1896
blanchet@33191	1897	\subsection{Scope of Search}
blanchet@33191	1898	\label{scope-of-search}
blanchet@33191	1899
blanchet@33191	1900	\begin{enum}
blanchet@34969	1901	\oparg{card}{type}{int\_seq}
blanchet@34121	1902	Specifies the sequence of cardinalities to use for a given type.
blanchet@34121	1903	For free types, and often also for \textbf{typedecl}'d types, it usually makes
blanchet@34121	1904	sense to specify cardinalities as a range of the form \textit{$1$--$n$}.
blanchet@34121	1905	Although function and product types are normally mapped directly to the
blanchet@34121	1906	corresponding Kodkod concepts, setting
blanchet@34121	1907	the cardinality of such types is also allowed and implicitly enables ``boxing''
blanchet@34121	1908	for them, as explained in the description of the \textit{box}~\qty{type}
blanchet@34121	1909	and \textit{box} (\S\ref{scope-of-search}) options.
blanchet@34121	1910
blanchet@34121	1911	\nopagebreak
blanchet@34121	1912	{\small See also \textit{mono} (\S\ref{scope-of-search}).}
blanchet@34121	1913
blanchet@34969	1914	\opdefault{card}{int\_seq}{$\mathbf{1}$--$\mathbf{8}$}
blanchet@34121	1915	Specifies the default sequence of cardinalities to use. This can be overridden
blanchet@34121	1916	on a per-type basis using the \textit{card}~\qty{type} option described above.
blanchet@34121	1917
blanchet@34969	1918	\oparg{max}{const}{int\_seq}
blanchet@34121	1919	Specifies the sequence of maximum multiplicities to use for a given
blanchet@34121	1920	(co)in\-duc\-tive datatype constructor. A constructor's multiplicity is the
blanchet@34121	1921	number of distinct values that it can construct. Nonsensical values (e.g.,
blanchet@34121	1922	\textit{max}~[]~$=$~2) are silently repaired. This option is only available for
blanchet@34121	1923	datatypes equipped with several constructors.
blanchet@34121	1924
blanchet@34969	1925	\opnodefault{max}{int\_seq}
blanchet@34121	1926	Specifies the default sequence of maximum multiplicities to use for
blanchet@34121	1927	(co)in\-duc\-tive datatype constructors. This can be overridden on a per-constructor
blanchet@34121	1928	basis using the \textit{max}~\qty{const} option described above.
blanchet@34121	1929
blanchet@34121	1930	\opsmart{binary\_ints}{unary\_ints}
blanchet@34121	1931	Specifies whether natural numbers and integers should be encoded using a unary
blanchet@34121	1932	or binary notation. In unary mode, the cardinality fully specifies the subset
blanchet@34121	1933	used to approximate the type. For example:
blanchet@33191	1934	%
blanchet@33191	1935	$$\hbox{\begin{tabular}{@{}rll@{}}%
blanchet@33191	1936	\textit{card nat} = 4 & induces & $\{0,\, 1,\, 2,\, 3\}$ \\
blanchet@33191	1937	\textit{card int} = 4 & induces & $\{-1,\, 0,\, +1,\, +2\}$ \\
blanchet@33191	1938	\textit{card int} = 5 & induces & $\{-2,\, -1,\, 0,\, +1,\, +2\}.$%
blanchet@33191	1939	\end{tabular}}$$
blanchet@33191	1940	%
blanchet@33191	1941	In general:
blanchet@33191	1942	%
blanchet@33191	1943	$$\hbox{\begin{tabular}{@{}rll@{}}%
blanchet@33191	1944	\textit{card nat} = $K$ & induces & $\{0,\, \ldots,\, K - 1\}$ \\
blanchet@33191	1945	\textit{card int} = $K$ & induces & $\{-\lceil K/2 \rceil + 1,\, \ldots,\, +\lfloor K/2 \rfloor\}.$%
blanchet@33191	1946	\end{tabular}}$$
blanchet@33191	1947	%
blanchet@34121	1948	In binary mode, the cardinality specifies the number of distinct values that can
blanchet@34121	1949	be constructed. Each of these values is represented by a bit pattern whose length
blanchet@34121	1950	is specified by the \textit{bits} (\S\ref{scope-of-search}) option. By default,
blanchet@34121	1951	Nitpick attempts to choose the more appropriate encoding by inspecting the
blanchet@34121	1952	formula at hand, preferring the binary notation for problems involving
blanchet@34121	1953	multiplicative operators or large constants.
blanchet@34121	1954
blanchet@34121	1955	\textbf{Warning:} For technical reasons, Nitpick always reverts to unary for
blanchet@34121	1956	problems that refer to the types \textit{rat} or \textit{real} or the constants
blanchet@34123	1957	\textit{Suc}, \textit{gcd}, or \textit{lcm}.
blanchet@34121	1958
blanchet@34121	1959	{\small See also \textit{bits} (\S\ref{scope-of-search}) and
blanchet@34121	1960	\textit{show\_datatypes} (\S\ref{output-format}).}
blanchet@34121	1961
blanchet@34969	1962	\opdefault{bits}{int\_seq}{$\mathbf{1},\mathbf{2},\mathbf{3},\mathbf{4},\mathbf{6},\mathbf{8},\mathbf{10},\mathbf{12}$}
blanchet@34121	1963	Specifies the number of bits to use to represent natural numbers and integers in
blanchet@34121	1964	binary, excluding the sign bit. The minimum is 1 and the maximum is 31.
blanchet@34121	1965
blanchet@34121	1966	{\small See also \textit{binary\_ints} (\S\ref{scope-of-search}).}
blanchet@33191	1967
blanchet@34969	1968	\opargboolorsmart{wf}{const}{non\_wf}
blanchet@33191	1969	Specifies whether the specified (co)in\-duc\-tively defined predicate is
blanchet@33191	1970	well-founded. The option can take the following values:
blanchet@33191	1971
blanchet@33191	1972	\begin{enum}
blanchet@33191	1973	\item[$\bullet$] \textbf{\textit{true}}: Tentatively treat the (co)in\-duc\-tive
blanchet@33191	1974	predicate as if it were well-founded. Since this is generally not sound when the
blanchet@33191	1975	predicate is not well-founded, the counterexamples are tagged as ``likely
blanchet@33191	1976	genuine.''
blanchet@33191	1977
blanchet@33191	1978	\item[$\bullet$] \textbf{\textit{false}}: Treat the (co)in\-duc\-tive predicate
blanchet@33191	1979	as if it were not well-founded. The predicate is then unrolled as prescribed by
blanchet@33191	1980	the \textit{star\_linear\_preds}, \textit{iter}~\qty{const}, and \textit{iter}
blanchet@33191	1981	options.
blanchet@33191	1982
blanchet@33191	1983	\item[$\bullet$] \textbf{\textit{smart}}: Try to prove that the inductive
blanchet@33191	1984	predicate is well-founded using Isabelle's \textit{lexicographic\_order} and
blanchet@34969	1985	\textit{size\_change} tactics. If this succeeds (or the predicate occurs with an
blanchet@33191	1986	appropriate polarity in the formula to falsify), use an efficient fixed point
blanchet@33191	1987	equation as specification of the predicate; otherwise, unroll the predicates
blanchet@33191	1988	according to the \textit{iter}~\qty{const} and \textit{iter} options.
blanchet@33191	1989	\end{enum}
blanchet@33191	1990
blanchet@33191	1991	\nopagebreak
blanchet@33191	1992	{\small See also \textit{iter} (\S\ref{scope-of-search}),
blanchet@33191	1993	\textit{star\_linear\_preds} (\S\ref{optimizations}), and \textit{tac\_timeout}
blanchet@33191	1994	(\S\ref{timeouts}).}
blanchet@33191	1995
blanchet@33191	1996	\opsmart{wf}{non\_wf}
blanchet@33191	1997	Specifies the default well-foundedness setting to use. This can be overridden on
blanchet@33191	1998	a per-predicate basis using the \textit{wf}~\qty{const} option above.
blanchet@33191	1999
blanchet@34969	2000	\oparg{iter}{const}{int\_seq}
blanchet@33191	2001	Specifies the sequence of iteration counts to use when unrolling a given
blanchet@33191	2002	(co)in\-duc\-tive predicate. By default, unrolling is applied for inductive
blanchet@33191	2003	predicates that occur negatively and coinductive predicates that occur
blanchet@33191	2004	positively in the formula to falsify and that cannot be proved to be
blanchet@33191	2005	well-founded, but this behavior is influenced by the \textit{wf} option. The
blanchet@33191	2006	iteration counts are automatically bounded by the cardinality of the predicate's
blanchet@33191	2007	domain.
blanchet@33191	2008
blanchet@33191	2009	{\small See also \textit{wf} (\S\ref{scope-of-search}) and
blanchet@33191	2010	\textit{star\_linear\_preds} (\S\ref{optimizations}).}
blanchet@33191	2011
blanchet@34969	2012	\opdefault{iter}{int\_seq}{$\mathbf{1{,}2{,}4{,}8{,}12{,}16{,}24{,}32}$}
blanchet@33191	2013	Specifies the sequence of iteration counts to use when unrolling (co)in\-duc\-tive
blanchet@33191	2014	predicates. This can be overridden on a per-predicate basis using the
blanchet@33191	2015	\textit{iter}~\qty{const} option above.
blanchet@33191	2016
blanchet@34969	2017	\opdefault{bisim\_depth}{int\_seq}{$\mathbf{7}$}
blanchet@33191	2018	Specifies the sequence of iteration counts to use when unrolling the
blanchet@33191	2019	bisimilarity predicate generated by Nitpick for coinductive datatypes. A value
blanchet@33191	2020	of $-1$ means that no predicate is generated, in which case Nitpick performs an
blanchet@33191	2021	after-the-fact check to see if the known coinductive datatype values are
blanchet@33191	2022	bidissimilar. If two values are found to be bisimilar, the counterexample is
blanchet@33191	2023	tagged as ``likely genuine.'' The iteration counts are automatically bounded by
blanchet@33191	2024	the sum of the cardinalities of the coinductive datatypes occurring in the
blanchet@33191	2025	formula to falsify.
blanchet@33191	2026
blanchet@34969	2027	\opargboolorsmart{box}{type}{dont\_box}
blanchet@33191	2028	Specifies whether Nitpick should attempt to wrap (``box'') a given function or
blanchet@33191	2029	product type in an isomorphic datatype internally. Boxing is an effective means
blanchet@33191	2030	to reduce the search space and speed up Nitpick, because the isomorphic datatype
blanchet@33191	2031	is approximated by a subset of the possible function or pair values;
blanchet@33191	2032	like other drastic optimizations, it can also prevent the discovery of
blanchet@33191	2033	counterexamples. The option can take the following values:
blanchet@33191	2034
blanchet@33191	2035	\begin{enum}
blanchet@33191	2036	\item[$\bullet$] \textbf{\textit{true}}: Box the specified type whenever
blanchet@33191	2037	practicable.
blanchet@33191	2038	\item[$\bullet$] \textbf{\textit{false}}: Never box the type.
blanchet@33191	2039	\item[$\bullet$] \textbf{\textit{smart}}: Box the type only in contexts where it
blanchet@33191	2040	is likely to help. For example, $n$-tuples where $n > 2$ and arguments to
blanchet@33191	2041	higher-order functions are good candidates for boxing.
blanchet@33191	2042	\end{enum}
blanchet@33191	2043
blanchet@33191	2044	Setting the \textit{card}~\qty{type} option for a function or product type
blanchet@33191	2045	implicitly enables boxing for that type.
blanchet@33191	2046
blanchet@33191	2047	\nopagebreak
blanchet@33191	2048	{\small See also \textit{verbose} (\S\ref{output-format})
blanchet@33191	2049	and \textit{debug} (\S\ref{output-format}).}
blanchet@33191	2050
blanchet@33191	2051	\opsmart{box}{dont\_box}
blanchet@33191	2052	Specifies the default boxing setting to use. This can be overridden on a
blanchet@33191	2053	per-type basis using the \textit{box}~\qty{type} option described above.
blanchet@33191	2054
blanchet@34969	2055	\opargboolorsmart{mono}{type}{non\_mono}
blanchet@34969	2056	Specifies whether the given type should be considered monotonic when
blanchet@33191	2057	enumerating scopes. If the option is set to \textit{smart}, Nitpick performs a
blanchet@33191	2058	monotonicity check on the type. Setting this option to \textit{true} can reduce
blanchet@33191	2059	the number of scopes tried, but it also diminishes the theoretical chance of
blanchet@33191	2060	finding a counterexample, as demonstrated in \S\ref{scope-monotonicity}.
blanchet@33191	2061
blanchet@33191	2062	\nopagebreak
blanchet@33191	2063	{\small See also \textit{card} (\S\ref{scope-of-search}),
blanchet@33547	2064	\textit{merge\_type\_vars} (\S\ref{scope-of-search}), and \textit{verbose}
blanchet@33191	2065	(\S\ref{output-format}).}
blanchet@33191	2066
blanchet@33191	2067	\opsmart{mono}{non\_mono}
blanchet@33191	2068	Specifies the default monotonicity setting to use. This can be overridden on a
blanchet@33191	2069	per-type basis using the \textit{mono}~\qty{type} option described above.
blanchet@33191	2070
blanchet@33547	2071	\opfalse{merge\_type\_vars}{dont\_merge\_type\_vars}
blanchet@33191	2072	Specifies whether type variables with the same sort constraints should be
blanchet@33191	2073	merged. Setting this option to \textit{true} can reduce the number of scopes
blanchet@33191	2074	tried and the size of the generated Kodkod formulas, but it also diminishes the
blanchet@33191	2075	theoretical chance of finding a counterexample.
blanchet@33191	2076
blanchet@33191	2077	{\small See also \textit{mono} (\S\ref{scope-of-search}).}
blanchet@34969	2078
blanchet@34969	2079	\opargbool{std}{type}{non\_std}
blanchet@34969	2080	Specifies whether the given type should be given standard models.
blanchet@34969	2081	Nonstandard models are unsound but can help debug inductive arguments,
blanchet@34969	2082	as explained in \S\ref{inductive-properties}.
blanchet@34969	2083
blanchet@34969	2084	\optrue{std}{non\_std}
blanchet@34969	2085	Specifies the default standardness to use. This can be overridden on a per-type
blanchet@34969	2086	basis using the \textit{std}~\qty{type} option described above.
blanchet@33191	2087	\end{enum}
blanchet@33191	2088
blanchet@33191	2089	\subsection{Output Format}
blanchet@33191	2090	\label{output-format}
blanchet@33191	2091
blanchet@33191	2092	\begin{enum}
blanchet@33191	2093	\opfalse{verbose}{quiet}
blanchet@33191	2094	Specifies whether the \textbf{nitpick} command should explain what it does. This
blanchet@33191	2095	option is useful to determine which scopes are tried or which SAT solver is
blanchet@33191	2096	used. This option is implicitly disabled for automatic runs.
blanchet@33191	2097
blanchet@33191	2098	\opfalse{debug}{no\_debug}
blanchet@33191	2099	Specifies whether Nitpick should display additional debugging information beyond
blanchet@33191	2100	what \textit{verbose} already displays. Enabling \textit{debug} also enables
blanchet@33191	2101	\textit{verbose} and \textit{show\_all} behind the scenes. The \textit{debug}
blanchet@33191	2102	option is implicitly disabled for automatic runs.
blanchet@33191	2103
blanchet@33191	2104	\nopagebreak
blanchet@33552	2105	{\small See also \textit{overlord} (\S\ref{mode-of-operation}) and
blanchet@33552	2106	\textit{batch\_size} (\S\ref{optimizations}).}
blanchet@33191	2107
blanchet@33191	2108	\optrue{show\_skolems}{hide\_skolems}
blanchet@33191	2109	Specifies whether the values of Skolem constants should be displayed as part of
blanchet@33191	2110	counterexamples. Skolem constants correspond to bound variables in the original
blanchet@33191	2111	formula and usually help us to understand why the counterexample falsifies the
blanchet@33191	2112	formula.
blanchet@33191	2113
blanchet@33191	2114	\nopagebreak
blanchet@33191	2115	{\small See also \textit{skolemize} (\S\ref{optimizations}).}
blanchet@33191	2116
blanchet@33191	2117	\opfalse{show\_datatypes}{hide\_datatypes}
blanchet@33191	2118	Specifies whether the subsets used to approximate (co)in\-duc\-tive datatypes should
blanchet@33191	2119	be displayed as part of counterexamples. Such subsets are sometimes helpful when
blanchet@33191	2120	investigating whether a potential counterexample is genuine or spurious, but
blanchet@33191	2121	their potential for clutter is real.
blanchet@33191	2122
blanchet@33191	2123	\opfalse{show\_consts}{hide\_consts}
blanchet@33191	2124	Specifies whether the values of constants occurring in the formula (including
blanchet@33191	2125	its axioms) should be displayed along with any counterexample. These values are
blanchet@33191	2126	sometimes helpful when investigating why a counterexample is
blanchet@33191	2127	genuine, but they can clutter the output.
blanchet@33191	2128
blanchet@33191	2129	\opfalse{show\_all}{dont\_show\_all}
blanchet@33191	2130	Enabling this option effectively enables \textit{show\_skolems},
blanchet@33191	2131	\textit{show\_datatypes}, and \textit{show\_consts}.
blanchet@33191	2132
blanchet@34969	2133	\opdefault{max\_potential}{int}{$\mathbf{1}$}
blanchet@33191	2134	Specifies the maximum number of potential counterexamples to display. Setting
blanchet@33191	2135	this option to 0 speeds up the search for a genuine counterexample. This option
blanchet@33191	2136	is implicitly set to 0 for automatic runs. If you set this option to a value
blanchet@33191	2137	greater than 1, you will need an incremental SAT solver: For efficiency, it is
blanchet@33191	2138	recommended to install the JNI version of MiniSat and set \textit{sat\_solver} =
blanchet@33191	2139	\textit{MiniSatJNI}. Also be aware that many of the counterexamples may look
blanchet@33191	2140	identical, unless the \textit{show\_all} (\S\ref{output-format}) option is
blanchet@33191	2141	enabled.
blanchet@33191	2142
blanchet@33191	2143	\nopagebreak
blanchet@33552	2144	{\small See also \textit{check\_potential} (\S\ref{authentication}) and
blanchet@33191	2145	\textit{sat\_solver} (\S\ref{optimizations}).}
blanchet@33191	2146
blanchet@34969	2147	\opdefault{max\_genuine}{int}{$\mathbf{1}$}
blanchet@33191	2148	Specifies the maximum number of genuine counterexamples to display. If you set
blanchet@33191	2149	this option to a value greater than 1, you will need an incremental SAT solver:
blanchet@33191	2150	For efficiency, it is recommended to install the JNI version of MiniSat and set
blanchet@33191	2151	\textit{sat\_solver} = \textit{MiniSatJNI}. Also be aware that many of the
blanchet@33191	2152	counterexamples may look identical, unless the \textit{show\_all}
blanchet@33191	2153	(\S\ref{output-format}) option is enabled.
blanchet@33191	2154
blanchet@33191	2155	\nopagebreak
blanchet@33191	2156	{\small See also \textit{check\_genuine} (\S\ref{authentication}) and
blanchet@33191	2157	\textit{sat\_solver} (\S\ref{optimizations}).}
blanchet@33191	2158
blanchet@34969	2159	\opnodefault{eval}{term\_list}
blanchet@33191	2160	Specifies the list of terms whose values should be displayed along with
blanchet@33191	2161	counterexamples. This option suffers from an ``observer effect'': Nitpick might
blanchet@33191	2162	find different counterexamples for different values of this option.
blanchet@33191	2163
blanchet@34969	2164	\oparg{format}{term}{int\_seq}
blanchet@33191	2165	Specifies how to uncurry the value displayed for a variable or constant.
blanchet@33191	2166	Uncurrying sometimes increases the readability of the output for high-arity
blanchet@33191	2167	functions. For example, given the variable $y \mathbin{\Colon} {'a}\Rightarrow
blanchet@33191	2168	{'b}\Rightarrow {'c}\Rightarrow {'d}\Rightarrow {'e}\Rightarrow {'f}\Rightarrow
blanchet@33191	2169	{'g}$, setting \textit{format}~$y$ = 3 tells Nitpick to group the last three
blanchet@33191	2170	arguments, as if the type had been ${'a}\Rightarrow {'b}\Rightarrow
blanchet@33191	2171	{'c}\Rightarrow {'d}\times {'e}\times {'f}\Rightarrow {'g}$. In general, a list
blanchet@33191	2172	of values $n_1,\ldots,n_k$ tells Nitpick to show the last $n_k$ arguments as an
blanchet@33191	2173	$n_k$-tuple, the previous $n_{k-1}$ arguments as an $n_{k-1}$-tuple, and so on;
blanchet@33191	2174	arguments that are not accounted for are left alone, as if the specification had
blanchet@33191	2175	been $1,\ldots,1,n_1,\ldots,n_k$.
blanchet@33191	2176
blanchet@33191	2177	\nopagebreak
blanchet@33191	2178	{\small See also \textit{uncurry} (\S\ref{optimizations}).}
blanchet@33191	2179
blanchet@34969	2180	\opdefault{format}{int\_seq}{$\mathbf{1}$}
blanchet@33191	2181	Specifies the default format to use. Irrespective of the default format, the
blanchet@33191	2182	extra arguments to a Skolem constant corresponding to the outer bound variables
blanchet@33191	2183	are kept separated from the remaining arguments, the \textbf{for} arguments of
blanchet@33191	2184	an inductive definition are kept separated from the remaining arguments, and
blanchet@33191	2185	the iteration counter of an unrolled inductive definition is shown alone. The
blanchet@33191	2186	default format can be overridden on a per-variable or per-constant basis using
blanchet@33191	2187	the \textit{format}~\qty{term} option described above.
blanchet@33191	2188	\end{enum}
blanchet@33191	2189
blanchet@33191	2190	%% MARK: Authentication
blanchet@33191	2191	\subsection{Authentication}
blanchet@33191	2192	\label{authentication}
blanchet@33191	2193
blanchet@33191	2194	\begin{enum}
blanchet@33191	2195	\opfalse{check\_potential}{trust\_potential}
blanchet@33191	2196	Specifies whether potential counterexamples should be given to Isabelle's
blanchet@33191	2197	\textit{auto} tactic to assess their validity. If a potential counterexample is
blanchet@33191	2198	shown to be genuine, Nitpick displays a message to this effect and terminates.
blanchet@33191	2199
blanchet@33191	2200	\nopagebreak
blanchet@33552	2201	{\small See also \textit{max\_potential} (\S\ref{output-format}).}
blanchet@33191	2202
blanchet@33191	2203	\opfalse{check\_genuine}{trust\_genuine}
blanchet@33191	2204	Specifies whether genuine and likely genuine counterexamples should be given to
blanchet@33191	2205	Isabelle's \textit{auto} tactic to assess their validity. If a ``genuine''
blanchet@33191	2206	counterexample is shown to be spurious, the user is kindly asked to send a bug
blanchet@33191	2207	report to the author at
blanchet@33191	2208	\texttt{blan{\color{white}nospam}\kern-\wd\boxA{}chette@in.tum.de}.
blanchet@33191	2209
blanchet@33191	2210	\nopagebreak
blanchet@33552	2211	{\small See also \textit{max\_genuine} (\S\ref{output-format}).}
blanchet@33191	2212
blanchet@34969	2213	\opnodefault{expect}{string}
blanchet@33191	2214	Specifies the expected outcome, which must be one of the following:
blanchet@33191	2215
blanchet@33191	2216	\begin{enum}
blanchet@33191	2217	\item[$\bullet$] \textbf{\textit{genuine}}: Nitpick found a genuine counterexample.
blanchet@33191	2218	\item[$\bullet$] \textbf{\textit{likely\_genuine}}: Nitpick found a ``likely
blanchet@33191	2219	genuine'' counterexample (i.e., a counterexample that is genuine unless
blanchet@33191	2220	it contradicts a missing axiom or a dangerous option was used inappropriately).
blanchet@33191	2221	\item[$\bullet$] \textbf{\textit{potential}}: Nitpick found a potential counterexample.
blanchet@33191	2222	\item[$\bullet$] \textbf{\textit{none}}: Nitpick found no counterexample.
blanchet@33191	2223	\item[$\bullet$] \textbf{\textit{unknown}}: Nitpick encountered some problem (e.g.,
blanchet@33191	2224	Kodkod ran out of memory).
blanchet@33191	2225	\end{enum}
blanchet@33191	2226
blanchet@33191	2227	Nitpick emits an error if the actual outcome differs from the expected outcome.
blanchet@33191	2228	This option is useful for regression testing.
blanchet@33191	2229	\end{enum}
blanchet@33191	2230
blanchet@33191	2231	\subsection{Optimizations}
blanchet@33191	2232	\label{optimizations}
blanchet@33191	2233
blanchet@33191	2234	\def\cpp{C\nobreak\raisebox{.1ex}{+}\nobreak\raisebox{.1ex}{+}}
blanchet@33191	2235
blanchet@33191	2236	\sloppy
blanchet@33191	2237
blanchet@33191	2238	\begin{enum}
blanchet@34969	2239	\opdefault{sat\_solver}{string}{smart}
blanchet@33191	2240	Specifies which SAT solver to use. SAT solvers implemented in C or \cpp{} tend
blanchet@33191	2241	to be faster than their Java counterparts, but they can be more difficult to
blanchet@33191	2242	install. Also, if you set the \textit{max\_potential} (\S\ref{output-format}) or
blanchet@33191	2243	\textit{max\_genuine} (\S\ref{output-format}) option to a value greater than 1,
blanchet@33191	2244	you will need an incremental SAT solver, such as \textit{MiniSatJNI}
blanchet@33191	2245	(recommended) or \textit{SAT4J}.
blanchet@33191	2246
blanchet@33191	2247	The supported solvers are listed below:
blanchet@33191	2248
blanchet@33191	2249	\begin{enum}
blanchet@33191	2250
blanchet@33191	2251	\item[$\bullet$] \textbf{\textit{MiniSat}}: MiniSat is an efficient solver
blanchet@33191	2252	written in \cpp{}. To use MiniSat, set the environment variable
blanchet@33191	2253	\texttt{MINISAT\_HOME} to the directory that contains the \texttt{minisat}
blanchet@33191	2254	executable. The \cpp{} sources and executables for MiniSat are available at
blanchet@33191	2255	\url{http://minisat.se/MiniSat.html}. Nitpick has been tested with versions 1.14
blanchet@33191	2256	and 2.0 beta (2007-07-21).
blanchet@33191	2257
blanchet@33191	2258	\item[$\bullet$] \textbf{\textit{MiniSatJNI}}: The JNI (Java Native Interface)
blanchet@33191	2259	version of MiniSat is bundled in \texttt{nativesolver.\allowbreak tgz}, which
blanchet@33191	2260	you will find on Kodkod's web site \cite{kodkod-2009}. Unlike the standard
blanchet@33191	2261	version of MiniSat, the JNI version can be used incrementally.
blanchet@33191	2262
blanchet@33726	2263	%%% No longer true:
blanchet@33726	2264	%%% "It is bundled with Kodkodi and requires no further installation or
blanchet@33726	2265	%%% configuration steps. Alternatively,"
blanchet@33191	2266	\item[$\bullet$] \textbf{\textit{PicoSAT}}: PicoSAT is an efficient solver
blanchet@33726	2267	written in C. You can install a standard version of
blanchet@33191	2268	PicoSAT and set the environment variable \texttt{PICOSAT\_HOME} to the directory
blanchet@33191	2269	that contains the \texttt{picosat} executable. The C sources for PicoSAT are
blanchet@33191	2270	available at \url{http://fmv.jku.at/picosat/} and are also bundled with Kodkodi.
blanchet@33191	2271	Nitpick has been tested with version 913.
blanchet@33191	2272
blanchet@33191	2273	\item[$\bullet$] \textbf{\textit{zChaff}}: zChaff is an efficient solver written
blanchet@33191	2274	in \cpp{}. To use zChaff, set the environment variable \texttt{ZCHAFF\_HOME} to
blanchet@33191	2275	the directory that contains the \texttt{zchaff} executable. The \cpp{} sources
blanchet@33191	2276	and executables for zChaff are available at
blanchet@33191	2277	\url{http://www.princeton.edu/~chaff/zchaff.html}. Nitpick has been tested with
blanchet@33191	2278	versions 2004-05-13, 2004-11-15, and 2007-03-12.
blanchet@33191	2279
blanchet@33191	2280	\item[$\bullet$] \textbf{\textit{zChaffJNI}}: The JNI version of zChaff is
blanchet@33191	2281	bundled in \texttt{native\-solver.\allowbreak tgz}, which you will find on
blanchet@33191	2282	Kodkod's web site \cite{kodkod-2009}.
blanchet@33191	2283
blanchet@33191	2284	\item[$\bullet$] \textbf{\textit{RSat}}: RSat is an efficient solver written in
blanchet@33191	2285	\cpp{}. To use RSat, set the environment variable \texttt{RSAT\_HOME} to the
blanchet@33191	2286	directory that contains the \texttt{rsat} executable. The \cpp{} sources for
blanchet@33191	2287	RSat are available at \url{http://reasoning.cs.ucla.edu/rsat/}. Nitpick has been
blanchet@33191	2288	tested with version 2.01.
blanchet@33191	2289
blanchet@33191	2290	\item[$\bullet$] \textbf{\textit{BerkMin}}: BerkMin561 is an efficient solver
blanchet@33191	2291	written in C. To use BerkMin, set the environment variable
blanchet@33191	2292	\texttt{BERKMIN\_HOME} to the directory that contains the \texttt{BerkMin561}
blanchet@33191	2293	executable. The BerkMin executables are available at
blanchet@33191	2294	\url{http://eigold.tripod.com/BerkMin.html}.
blanchet@33191	2295
blanchet@33191	2296	\item[$\bullet$] \textbf{\textit{BerkMinAlloy}}: Variant of BerkMin that is
blanchet@33191	2297	included with Alloy 4 and calls itself ``sat56'' in its banner text. To use this
blanchet@33191	2298	version of BerkMin, set the environment variable
blanchet@33191	2299	\texttt{BERKMINALLOY\_HOME} to the directory that contains the \texttt{berkmin}
blanchet@33191	2300	executable.
blanchet@33191	2301
blanchet@33191	2302	\item[$\bullet$] \textbf{\textit{Jerusat}}: Jerusat 1.3 is an efficient solver
blanchet@33191	2303	written in C. To use Jerusat, set the environment variable
blanchet@33191	2304	\texttt{JERUSAT\_HOME} to the directory that contains the \texttt{Jerusat1.3}
blanchet@33191	2305	executable. The C sources for Jerusat are available at
blanchet@33191	2306	\url{http://www.cs.tau.ac.il/~ale1/Jerusat1.3.tgz}.
blanchet@33191	2307
blanchet@33191	2308	\item[$\bullet$] \textbf{\textit{SAT4J}}: SAT4J is a reasonably efficient solver
blanchet@33191	2309	written in Java that can be used incrementally. It is bundled with Kodkodi and
blanchet@33191	2310	requires no further installation or configuration steps. Do not attempt to
blanchet@33191	2311	install the official SAT4J packages, because their API is incompatible with
blanchet@33191	2312	Kodkod.
blanchet@33191	2313
blanchet@33191	2314	\item[$\bullet$] \textbf{\textit{SAT4JLight}}: Variant of SAT4J that is
blanchet@33191	2315	optimized for small problems. It can also be used incrementally.
blanchet@33191	2316
blanchet@33191	2317	\item[$\bullet$] \textbf{\textit{HaifaSat}}: HaifaSat 1.0 beta is an
blanchet@33191	2318	experimental solver written in \cpp. To use HaifaSat, set the environment
blanchet@33191	2319	variable \texttt{HAIFASAT\_\allowbreak HOME} to the directory that contains the
blanchet@33191	2320	\texttt{HaifaSat} executable. The \cpp{} sources for HaifaSat are available at
blanchet@33191	2321	\url{http://cs.technion.ac.il/~gershman/HaifaSat.htm}.
blanchet@33191	2322
blanchet@33191	2323	\item[$\bullet$] \textbf{\textit{smart}}: If \textit{sat\_solver} is set to
blanchet@33726	2324	\textit{smart}, Nitpick selects the first solver among MiniSat,
blanchet@33726	2325	PicoSAT, zChaff, RSat, BerkMin, BerkMinAlloy, Jerusat, MiniSatJNI, and zChaffJNI
blanchet@33726	2326	that is recognized by Isabelle. If none is found, it falls back on SAT4J, which
blanchet@33726	2327	should always be available. If \textit{verbose} (\S\ref{output-format}) is
blanchet@33726	2328	enabled, Nitpick displays which SAT solver was chosen.
blanchet@33191	2329	\end{enum}
blanchet@33191	2330	\fussy
blanchet@33191	2331
blanchet@34969	2332	\opdefault{batch\_size}{int\_or\_smart}{smart}
blanchet@33191	2333	Specifies the maximum number of Kodkod problems that should be lumped together
blanchet@33191	2334	when invoking Kodkodi. Each problem corresponds to one scope. Lumping problems
blanchet@33191	2335	together ensures that Kodkodi is launched less often, but it makes the verbose
blanchet@33191	2336	output less readable and is sometimes detrimental to performance. If
blanchet@33191	2337	\textit{batch\_size} is set to \textit{smart}, the actual value used is 1 if
blanchet@33191	2338	\textit{debug} (\S\ref{output-format}) is set and 64 otherwise.
blanchet@33191	2339
blanchet@33191	2340	\optrue{destroy\_constrs}{dont\_destroy\_constrs}
blanchet@33191	2341	Specifies whether formulas involving (co)in\-duc\-tive datatype constructors should
blanchet@33191	2342	be rewritten to use (automatically generated) discriminators and destructors.
blanchet@33191	2343	This optimization can drastically reduce the size of the Boolean formulas given
blanchet@33191	2344	to the SAT solver.
blanchet@33191	2345
blanchet@33191	2346	\nopagebreak
blanchet@33191	2347	{\small See also \textit{debug} (\S\ref{output-format}).}
blanchet@33191	2348
blanchet@33191	2349	\optrue{specialize}{dont\_specialize}
blanchet@33191	2350	Specifies whether functions invoked with static arguments should be specialized.
blanchet@33191	2351	This optimization can drastically reduce the search space, especially for
blanchet@33191	2352	higher-order functions.
blanchet@33191	2353
blanchet@33191	2354	\nopagebreak
blanchet@33191	2355	{\small See also \textit{debug} (\S\ref{output-format}) and
blanchet@33191	2356	\textit{show\_consts} (\S\ref{output-format}).}
blanchet@33191	2357
blanchet@33191	2358	\optrue{skolemize}{dont\_skolemize}
blanchet@33191	2359	Specifies whether the formula should be skolemized. For performance reasons,
blanchet@33191	2360	(positive) $\forall$-quanti\-fiers that occur in the scope of a higher-order
blanchet@33191	2361	(positive) $\exists$-quanti\-fier are left unchanged.
blanchet@33191	2362
blanchet@33191	2363	\nopagebreak
blanchet@33191	2364	{\small See also \textit{debug} (\S\ref{output-format}) and
blanchet@33191	2365	\textit{show\_skolems} (\S\ref{output-format}).}
blanchet@33191	2366
blanchet@33191	2367	\optrue{star\_linear\_preds}{dont\_star\_linear\_preds}
blanchet@33191	2368	Specifies whether Nitpick should use Kodkod's transitive closure operator to
blanchet@33191	2369	encode non-well-founded ``linear inductive predicates,'' i.e., inductive
blanchet@33191	2370	predicates for which the predicate occurs in at most one assumption of each
blanchet@33191	2371	introduction rule. Using the reflexive transitive closure is in principle
blanchet@33191	2372	equivalent to setting \textit{iter} to the cardinality of the predicate's
blanchet@33191	2373	domain, but it is usually more efficient.
blanchet@33191	2374
blanchet@33191	2375	{\small See also \textit{wf} (\S\ref{scope-of-search}), \textit{debug}
blanchet@33191	2376	(\S\ref{output-format}), and \textit{iter} (\S\ref{scope-of-search}).}
blanchet@33191	2377
blanchet@33191	2378	\optrue{uncurry}{dont\_uncurry}
blanchet@33191	2379	Specifies whether Nitpick should uncurry functions. Uncurrying has on its own no
blanchet@33191	2380	tangible effect on efficiency, but it creates opportunities for the boxing
blanchet@33191	2381	optimization.
blanchet@33191	2382
blanchet@33191	2383	\nopagebreak
blanchet@33191	2384	{\small See also \textit{box} (\S\ref{scope-of-search}), \textit{debug}
blanchet@33191	2385	(\S\ref{output-format}), and \textit{format} (\S\ref{output-format}).}
blanchet@33191	2386
blanchet@33191	2387	\optrue{fast\_descrs}{full\_descrs}
blanchet@33191	2388	Specifies whether Nitpick should optimize the definite and indefinite
blanchet@33191	2389	description operators (THE and SOME). The optimized versions usually help
blanchet@33191	2390	Nitpick generate more counterexamples or at least find them faster, but only the
blanchet@33191	2391	unoptimized versions are complete when all types occurring in the formula are
blanchet@33191	2392	finite.
blanchet@33191	2393
blanchet@33191	2394	{\small See also \textit{debug} (\S\ref{output-format}).}
blanchet@33191	2395
blanchet@33191	2396	\optrue{peephole\_optim}{no\_peephole\_optim}
blanchet@33191	2397	Specifies whether Nitpick should simplify the generated Kodkod formulas using a
blanchet@33191	2398	peephole optimizer. These optimizations can make a significant difference.
blanchet@33191	2399	Unless you are tracking down a bug in Nitpick or distrust the peephole
blanchet@33191	2400	optimizer, you should leave this option enabled.
blanchet@33191	2401
blanchet@34969	2402	\opdefault{sym\_break}{int}{20}
blanchet@33191	2403	Specifies an upper bound on the number of relations for which Kodkod generates
blanchet@33191	2404	symmetry breaking predicates. According to the Kodkod documentation
blanchet@33191	2405	\cite{kodkod-2009-options}, ``in general, the higher this value, the more
blanchet@33191	2406	symmetries will be broken, and the faster the formula will be solved. But,
blanchet@33191	2407	setting the value too high may have the opposite effect and slow down the
blanchet@33191	2408	solving.''
blanchet@33191	2409
blanchet@34969	2410	\opdefault{sharing\_depth}{int}{3}
blanchet@33191	2411	Specifies the depth to which Kodkod should check circuits for equivalence during
blanchet@33191	2412	the translation to SAT. The default of 3 is the same as in Alloy. The minimum
blanchet@33191	2413	allowed depth is 1. Increasing the sharing may result in a smaller SAT problem,
blanchet@33191	2414	but can also slow down Kodkod.
blanchet@33191	2415
blanchet@33191	2416	\opfalse{flatten\_props}{dont\_flatten\_props}
blanchet@33191	2417	Specifies whether Kodkod should try to eliminate intermediate Boolean variables.
blanchet@33191	2418	Although this might sound like a good idea, in practice it can drastically slow
blanchet@33191	2419	down Kodkod.
blanchet@33191	2420
blanchet@34969	2421	\opdefault{max\_threads}{int}{0}
blanchet@33191	2422	Specifies the maximum number of threads to use in Kodkod. If this option is set
blanchet@33191	2423	to 0, Kodkod will compute an appropriate value based on the number of processor
blanchet@33191	2424	cores available.
blanchet@33191	2425
blanchet@33191	2426	\nopagebreak
blanchet@33191	2427	{\small See also \textit{batch\_size} (\S\ref{optimizations}) and
blanchet@33191	2428	\textit{timeout} (\S\ref{timeouts}).}
blanchet@33191	2429	\end{enum}
blanchet@33191	2430
blanchet@33191	2431	\subsection{Timeouts}
blanchet@33191	2432	\label{timeouts}
blanchet@33191	2433
blanchet@33191	2434	\begin{enum}
blanchet@34969	2435	\opdefault{timeout}{time}{$\mathbf{30}$\,s}
blanchet@33191	2436	Specifies the maximum amount of time that the \textbf{nitpick} command should
blanchet@33191	2437	spend looking for a counterexample. Nitpick tries to honor this constraint as
blanchet@33191	2438	well as it can but offers no guarantees. For automatic runs,
blanchet@33552	2439	\textit{timeout} is ignored; instead, Auto Quickcheck and Auto Nitpick share
blanchet@33552	2440	a time slot whose length is specified by the ``Auto Counterexample Time
blanchet@33552	2441	Limit'' option in Proof General.
blanchet@33191	2442
blanchet@33191	2443	\nopagebreak
blanchet@33552	2444	{\small See also \textit{max\_threads} (\S\ref{optimizations}).}
blanchet@33191	2445
blanchet@34969	2446	\opdefault{tac\_timeout}{time}{$\mathbf{500}$\,ms}
blanchet@33191	2447	Specifies the maximum amount of time that the \textit{auto} tactic should use
blanchet@33191	2448	when checking a counterexample, and similarly that \textit{lexicographic\_order}
blanchet@34969	2449	and \textit{size\_change} should use when checking whether a (co)in\-duc\-tive
blanchet@33191	2450	predicate is well-founded. Nitpick tries to honor this constraint as well as it
blanchet@33191	2451	can but offers no guarantees.
blanchet@33191	2452
blanchet@33191	2453	\nopagebreak
blanchet@33191	2454	{\small See also \textit{wf} (\S\ref{scope-of-search}),
blanchet@33191	2455	\textit{check\_potential} (\S\ref{authentication}),
blanchet@33191	2456	and \textit{check\_genuine} (\S\ref{authentication}).}
blanchet@33191	2457	\end{enum}
blanchet@33191	2458
blanchet@33191	2459	\section{Attribute Reference}
blanchet@33191	2460	\label{attribute-reference}
blanchet@33191	2461
blanchet@33191	2462	Nitpick needs to consider the definitions of all constants occurring in a
blanchet@33191	2463	formula in order to falsify it. For constants introduced using the
blanchet@33191	2464	\textbf{definition} command, the definition is simply the associated
blanchet@33191	2465	\textit{\_def} axiom. In contrast, instead of using the internal representation
blanchet@33191	2466	of functions synthesized by Isabelle's \textbf{primrec}, \textbf{function}, and
blanchet@33191	2467	\textbf{nominal\_primrec} packages, Nitpick relies on the more natural
blanchet@33191	2468	equational specification entered by the user.
blanchet@33191	2469
blanchet@33191	2470	Behind the scenes, Isabelle's built-in packages and theories rely on the
blanchet@33191	2471	following attributes to affect Nitpick's behavior:
blanchet@33191	2472
blanchet@33191	2473	\begin{itemize}
blanchet@33191	2474	\flushitem{\textit{nitpick\_def}}
blanchet@33191	2475
blanchet@33191	2476	\nopagebreak
blanchet@33191	2477	This attribute specifies an alternative definition of a constant. The
blanchet@33191	2478	alternative definition should be logically equivalent to the constant's actual
blanchet@33191	2479	axiomatic definition and should be of the form
blanchet@33191	2480
blanchet@33191	2481	\qquad $c~{?}x_1~\ldots~{?}x_n \,\equiv\, t$,
blanchet@33191	2482
blanchet@33191	2483	where ${?}x_1, \ldots, {?}x_n$ are distinct variables and $c$ does not occur in
blanchet@33191	2484	$t$.
blanchet@33191	2485
blanchet@33191	2486	\flushitem{\textit{nitpick\_simp}}
blanchet@33191	2487
blanchet@33191	2488	\nopagebreak
blanchet@33191	2489	This attribute specifies the equations that constitute the specification of a
blanchet@33191	2490	constant. For functions defined using the \textbf{primrec}, \textbf{function},
blanchet@33191	2491	and \textbf{nominal\_\allowbreak primrec} packages, this corresponds to the
blanchet@33191	2492	\textit{simps} rules. The equations must be of the form
blanchet@33191	2493
blanchet@33191	2494	\qquad $c~t_1~\ldots\ t_n \,=\, u$.
blanchet@33191	2495
blanchet@33191	2496	\flushitem{\textit{nitpick\_psimp}}
blanchet@33191	2497
blanchet@33191	2498	\nopagebreak
blanchet@33191	2499	This attribute specifies the equations that constitute the partial specification
blanchet@33191	2500	of a constant. For functions defined using the \textbf{function} package, this
blanchet@33191	2501	corresponds to the \textit{psimps} rules. The conditional equations must be of
blanchet@33191	2502	the form
blanchet@33191	2503
blanchet@33191	2504	\qquad $\lbrakk P_1;\> \ldots;\> P_m\rbrakk \,\Longrightarrow\, c\ t_1\ \ldots\ t_n \,=\, u$.
blanchet@33191	2505
blanchet@33191	2506	\flushitem{\textit{nitpick\_intro}}
blanchet@33191	2507
blanchet@33191	2508	\nopagebreak
blanchet@33191	2509	This attribute specifies the introduction rules of a (co)in\-duc\-tive predicate.
blanchet@33191	2510	For predicates defined using the \textbf{inductive} or \textbf{coinductive}
blanchet@33191	2511	command, this corresponds to the \textit{intros} rules. The introduction rules
blanchet@33191	2512	must be of the form
blanchet@33191	2513
blanchet@33191	2514	\qquad $\lbrakk P_1;\> \ldots;\> P_m;\> M~(c\ t_{11}\ \ldots\ t_{1n});\>
blanchet@33191	2515	\ldots;\> M~(c\ t_{k1}\ \ldots\ t_{kn})\rbrakk \,\Longrightarrow\, c\ u_1\
blanchet@33191	2516	\ldots\ u_n$,
blanchet@33191	2517
blanchet@33191	2518	where the $P_i$'s are side conditions that do not involve $c$ and $M$ is an
blanchet@33191	2519	optional monotonic operator. The order of the assumptions is irrelevant.
blanchet@33191	2520
blanchet@33191	2521	\end{itemize}
blanchet@33191	2522
blanchet@33191	2523	When faced with a constant, Nitpick proceeds as follows:
blanchet@33191	2524
blanchet@33191	2525	\begin{enum}
blanchet@33191	2526	\item[1.] If the \textit{nitpick\_simp} set associated with the constant
blanchet@33191	2527	is not empty, Nitpick uses these rules as the specification of the constant.
blanchet@33191	2528
blanchet@33191	2529	\item[2.] Otherwise, if the \textit{nitpick\_psimp} set associated with
blanchet@33191	2530	the constant is not empty, it uses these rules as the specification of the
blanchet@33191	2531	constant.
blanchet@33191	2532
blanchet@33191	2533	\item[3.] Otherwise, it looks up the definition of the constant:
blanchet@33191	2534
blanchet@33191	2535	\begin{enum}
blanchet@33191	2536	\item[1.] If the \textit{nitpick\_def} set associated with the constant
blanchet@33191	2537	is not empty, it uses the latest rule added to the set as the definition of the
blanchet@33191	2538	constant; otherwise it uses the actual definition axiom.
blanchet@33191	2539	\item[2.] If the definition is of the form
blanchet@33191	2540
blanchet@33191	2541	\qquad $c~{?}x_1~\ldots~{?}x_m \,\equiv\, \lambda y_1~\ldots~y_n.\; \textit{lfp}~(\lambda f.\; t)$,
blanchet@33191	2542
blanchet@33191	2543	then Nitpick assumes that the definition was made using an inductive package and
blanchet@33191	2544	based on the introduction rules marked with \textit{nitpick\_\allowbreak
blanchet@33191	2545	intro} tries to determine whether the definition is
blanchet@33191	2546	well-founded.
blanchet@33191	2547	\end{enum}
blanchet@33191	2548	\end{enum}
blanchet@33191	2549
blanchet@33191	2550	As an illustration, consider the inductive definition
blanchet@33191	2551
blanchet@33191	2552	\prew
blanchet@33191	2553	\textbf{inductive}~\textit{odd}~\textbf{where} \\
blanchet@33191	2554	``\textit{odd}~1'' $\,\mid$ \\
blanchet@33191	2555	``\textit{odd}~$n\,\Longrightarrow\, \textit{odd}~(\textit{Suc}~(\textit{Suc}~n))$''
blanchet@33191	2556	\postw
blanchet@33191	2557
blanchet@33191	2558	Isabelle automatically attaches the \textit{nitpick\_intro} attribute to
blanchet@33191	2559	the above rules. Nitpick then uses the \textit{lfp}-based definition in
blanchet@33191	2560	conjunction with these rules. To override this, we can specify an alternative
blanchet@33191	2561	definition as follows:
blanchet@33191	2562
blanchet@33191	2563	\prew
blanchet@33191	2564	\textbf{lemma} $\mathit{odd\_def}'$ [\textit{nitpick\_def}]: ``$\textit{odd}~n \,\equiv\, n~\textrm{mod}~2 = 1$''
blanchet@33191	2565	\postw
blanchet@33191	2566
blanchet@33191	2567	Nitpick then expands all occurrences of $\mathit{odd}~n$ to $n~\textrm{mod}~2
blanchet@33191	2568	= 1$. Alternatively, we can specify an equational specification of the constant:
blanchet@33191	2569
blanchet@33191	2570	\prew
blanchet@33191	2571	\textbf{lemma} $\mathit{odd\_simp}'$ [\textit{nitpick\_simp}]: ``$\textit{odd}~n = (n~\textrm{mod}~2 = 1)$''
blanchet@33191	2572	\postw
blanchet@33191	2573
blanchet@33191	2574	Such tweaks should be done with great care, because Nitpick will assume that the
blanchet@33191	2575	constant is completely defined by its equational specification. For example, if
blanchet@33191	2576	you make ``$\textit{odd}~(2 * k + 1)$'' a \textit{nitpick\_simp} rule and neglect to provide rules to handle the $2 * k$ case, Nitpick will define
blanchet@33191	2577	$\textit{odd}~n$ arbitrarily for even values of $n$. The \textit{debug}
blanchet@33191	2578	(\S\ref{output-format}) option is extremely useful to understand what is going
blanchet@33191	2579	on when experimenting with \textit{nitpick\_} attributes.
blanchet@33191	2580
blanchet@33191	2581	\section{Standard ML Interface}
blanchet@33191	2582	\label{standard-ml-interface}
blanchet@33191	2583
blanchet@33191	2584	Nitpick provides a rich Standard ML interface used mainly for internal purposes
blanchet@33191	2585	and debugging. Among the most interesting functions exported by Nitpick are
blanchet@33191	2586	those that let you invoke the tool programmatically and those that let you
blanchet@33191	2587	register and unregister custom coinductive datatypes.
blanchet@33191	2588
blanchet@33191	2589	\subsection{Invocation of Nitpick}
blanchet@33191	2590	\label{invocation-of-nitpick}
blanchet@33191	2591
blanchet@33191	2592	The \textit{Nitpick} structure offers the following functions for invoking your
blanchet@33191	2593	favorite counterexample generator:
blanchet@33191	2594
blanchet@33191	2595	\prew
blanchet@33191	2596	$\textbf{val}\,~\textit{pick\_nits\_in\_term} : \\
blanchet@33191	2597	\hbox{}\quad\textit{Proof.state} \rightarrow \textit{params} \rightarrow \textit{bool} \rightarrow \textit{term~list} \rightarrow \textit{term} \\
blanchet@33191	2598	\hbox{}\quad{\rightarrow}\; \textit{string} * \textit{Proof.state}$ \\
blanchet@33191	2599	$\textbf{val}\,~\textit{pick\_nits\_in\_subgoal} : \\
blanchet@33191	2600	\hbox{}\quad\textit{Proof.state} \rightarrow \textit{params} \rightarrow \textit{bool} \rightarrow \textit{int} \rightarrow \textit{string} * \textit{Proof.state}$
blanchet@33191	2601	\postw
blanchet@33191	2602
blanchet@33191	2603	The return value is a new proof state paired with an outcome string
blanchet@33191	2604	(``genuine'', ``likely\_genuine'', ``potential'', ``none'', or ``unknown''). The
blanchet@33191	2605	\textit{params} type is a large record that lets you set Nitpick's options. The
blanchet@33191	2606	current default options can be retrieved by calling the following function
blanchet@33224	2607	defined in the \textit{Nitpick\_Isar} structure:
blanchet@33191	2608
blanchet@33191	2609	\prew
blanchet@33191	2610	$\textbf{val}\,~\textit{default\_params} :\,
blanchet@33191	2611	\textit{theory} \rightarrow (\textit{string} * \textit{string})~\textit{list} \rightarrow \textit{params}$
blanchet@33191	2612	\postw
blanchet@33191	2613
blanchet@33191	2614	The second argument lets you override option values before they are parsed and
blanchet@33191	2615	put into a \textit{params} record. Here is an example:
blanchet@33191	2616
blanchet@33191	2617	\prew
blanchet@33224	2618	$\textbf{val}\,~\textit{params} = \textit{Nitpick\_Isar.default\_params}~\textit{thy}~[(\textrm{``}\textrm{timeout}\textrm{''},\, \textrm{``}\textrm{none}\textrm{''})]$ \\
blanchet@33191	2619	$\textbf{val}\,~(\textit{outcome},\, \textit{state}') = \textit{Nitpick.pick\_nits\_in\_subgoal}~\begin{aligned}[t]
blanchet@33191	2620	& \textit{state}~\textit{params}~\textit{false} \\[-2pt]
blanchet@33191	2621	& \textit{subgoal}\end{aligned}$
blanchet@33191	2622	\postw
blanchet@33191	2623
blanchet@33548	2624	\let\antiq=\textrm
blanchet@33548	2625
blanchet@33191	2626	\subsection{Registration of Coinductive Datatypes}
blanchet@33191	2627	\label{registration-of-coinductive-datatypes}
blanchet@33191	2628
blanchet@33191	2629	If you have defined a custom coinductive datatype, you can tell Nitpick about
blanchet@33191	2630	it, so that it can use an efficient Kodkod axiomatization similar to the one it
blanchet@33191	2631	uses for lazy lists. The interface for registering and unregistering coinductive
blanchet@33191	2632	datatypes consists of the following pair of functions defined in the
blanchet@33191	2633	\textit{Nitpick} structure:
blanchet@33191	2634
blanchet@33191	2635	\prew
blanchet@33191	2636	$\textbf{val}\,~\textit{register\_codatatype} :\,
blanchet@33191	2637	\textit{typ} \rightarrow \textit{string} \rightarrow \textit{styp~list} \rightarrow \textit{theory} \rightarrow \textit{theory}$ \\
blanchet@33191	2638	$\textbf{val}\,~\textit{unregister\_codatatype} :\,
blanchet@33191	2639	\textit{typ} \rightarrow \textit{theory} \rightarrow \textit{theory}$
blanchet@33191	2640	\postw
blanchet@33191	2641
blanchet@33191	2642	The type $'a~\textit{llist}$ of lazy lists is already registered; had it
blanchet@33191	2643	not been, you could have told Nitpick about it by adding the following line
blanchet@33191	2644	to your theory file:
blanchet@33191	2645
blanchet@33191	2646	\prew
blanchet@33191	2647	$\textbf{setup}~\,\{{*}\,~\!\begin{aligned}[t]
blanchet@33191	2648	& \textit{Nitpick.register\_codatatype} \\[-2pt]
blanchet@33191	2649	& \qquad @\{\antiq{typ}~``\kern1pt'a~\textit{llist}\textrm{''}\}~@\{\antiq{const\_name}~ \textit{llist\_case}\} \\[-2pt] %% TYPESETTING
blanchet@33191	2650	& \qquad (\textit{map}~\textit{dest\_Const}~[@\{\antiq{term}~\textit{LNil}\},\, @\{\antiq{term}~\textit{LCons}\}])\,\ {*}\}\end{aligned}$
blanchet@33191	2651	\postw
blanchet@33191	2652
blanchet@33191	2653	The \textit{register\_codatatype} function takes a coinductive type, its case
blanchet@33191	2654	function, and the list of its constructors. The case function must take its
blanchet@33191	2655	arguments in the order that the constructors are listed. If no case function
blanchet@33191	2656	with the correct signature is available, simply pass the empty string.
blanchet@33191	2657
blanchet@33191	2658	On the other hand, if your goal is to cripple Nitpick, add the following line to
blanchet@33191	2659	your theory file and try to check a few conjectures about lazy lists:
blanchet@33191	2660
blanchet@33191	2661	\prew
blanchet@33191	2662	$\textbf{setup}~\,\{{*}\,~\textit{Nitpick.unregister\_codatatype}~@\{\antiq{typ}~``
blanchet@33191	2663	\kern1pt'a~\textit{llist}\textrm{''}\}\ \,{*}\}$
blanchet@33191	2664	\postw
blanchet@33191	2665
blanchet@33572	2666	Inductive datatypes can be registered as coinductive datatypes, given
blanchet@33572	2667	appropriate coinductive constructors. However, doing so precludes
blanchet@33572	2668	the use of the inductive constructors---Nitpick will generate an error if they
blanchet@33572	2669	are needed.
blanchet@33572	2670
blanchet@33191	2671	\section{Known Bugs and Limitations}
blanchet@33191	2672	\label{known-bugs-and-limitations}
blanchet@33191	2673
blanchet@33191	2674	Here are the known bugs and limitations in Nitpick at the time of writing:
blanchet@33191	2675
blanchet@33191	2676	\begin{enum}
blanchet@33191	2677	\item[$\bullet$] Underspecified functions defined using the \textbf{primrec},
blanchet@33191	2678	\textbf{function}, or \textbf{nominal\_\allowbreak primrec} packages can lead
blanchet@33191	2679	Nitpick to generate spurious counterexamples for theorems that refer to values
blanchet@33191	2680	for which the function is not defined. For example:
blanchet@33191	2681
blanchet@33191	2682	\prew
blanchet@33191	2683	\textbf{primrec} \textit{prec} \textbf{where} \\
blanchet@33191	2684	``$\textit{prec}~(\textit{Suc}~n) = n$'' \\[2\smallskipamount]
blanchet@33191	2685	\textbf{lemma} ``$\textit{prec}~0 = \textit{undefined}$'' \\
blanchet@33191	2686	\textbf{nitpick} \\[2\smallskipamount]
blanchet@33191	2687	\quad{\slshape Nitpick found a counterexample for \textit{card nat}~= 2:
blanchet@33191	2688	\nopagebreak
blanchet@33191	2689	\\[2\smallskipamount]
blanchet@33191	2690	\hbox{}\qquad Empty assignment} \nopagebreak\\[2\smallskipamount]
blanchet@34969	2691	\textbf{by}~(\textit{auto simp}:~\textit{prec\_def})
blanchet@33191	2692	\postw
blanchet@33191	2693
blanchet@33191	2694	Such theorems are considered bad style because they rely on the internal
blanchet@33191	2695	representation of functions synthesized by Isabelle, which is an implementation
blanchet@33191	2696	detail.
blanchet@33191	2697
blanchet@33550	2698	\item[$\bullet$] Nitpick maintains a global cache of wellfoundedness conditions,
blanchet@33547	2699	which can become invalid if you change the definition of an inductive predicate
blanchet@33547	2700	that is registered in the cache. To clear the cache,
blanchet@33547	2701	run Nitpick with the \textit{tac\_timeout} option set to a new value (e.g.,
blanchet@33547	2702	501$\,\textit{ms}$).
blanchet@33547	2703
blanchet@33191	2704	\item[$\bullet$] Nitpick produces spurious counterexamples when invoked after a
blanchet@33191	2705	\textbf{guess} command in a structured proof.
blanchet@33191	2706
blanchet@33191	2707	\item[$\bullet$] The \textit{nitpick\_} attributes and the
blanchet@33191	2708	\textit{Nitpick.register\_} functions can cause havoc if used improperly.
blanchet@33191	2709
blanchet@33570	2710	\item[$\bullet$] Although this has never been observed, arbitrary theorem
blanchet@33572	2711	morphisms could possibly confuse Nitpick, resulting in spurious counterexamples.
blanchet@33570	2712
blanchet@33191	2713	\item[$\bullet$] Local definitions are not supported and result in an error.
blanchet@33191	2714
blanchet@33726	2715	%\item[$\bullet$] All constants and types whose names start with
blanchet@33726	2716	%\textit{Nitpick}{.} are reserved for internal use.
blanchet@33191	2717	\end{enum}
blanchet@33191	2718
blanchet@33191	2719	\let\em=\sl
blanchet@33191	2720	\bibliography{../manual}{}
blanchet@33191	2721	\bibliographystyle{abbrv}
blanchet@33191	2722
blanchet@33191	2723	\end{document}

author	blanchet
	Tue, 02 Feb 2010 11:38:38 +0100
changeset 34969	7b8c366e34a2
parent 34123	8a2c5d7aff51
child 34985	5e492a862b34
permissions	-rw-r--r--