| author | wenzelm |
| Wed, 17 Aug 2022 16:03:36 +0200 | |
| changeset 75890 | a1336e2d7680 |
| parent 75806 | 2b106aae897c |
| child 75872 | 8bfad7bc74cb |
| permissions | -rw-r--r-- |
| 36926 | 1 |
\documentclass[a4paper,12pt]{article}
|
2 |
\usepackage[T1]{fontenc}
|
|
3 |
\usepackage{amsmath}
|
|
4 |
\usepackage{amssymb}
|
|
5 |
\usepackage{color}
|
|
6 |
\usepackage{footmisc}
|
|
7 |
\usepackage{graphicx}
|
|
8 |
%\usepackage{mathpazo}
|
|
9 |
\usepackage{multicol}
|
|
10 |
\usepackage{stmaryrd}
|
|
11 |
%\usepackage[scaled=.85]{beramono}
|
|
|
48962
a1acc1cb0271
more standard document preparation within session context;
wenzelm
parents:
48803
diff
changeset
|
12 |
\usepackage{isabelle,iman,pdfsetup}
|
| 36926 | 13 |
|
| 68649 | 14 |
\newcommand\download{\url{https://isabelle.in.tum.de/components/}}
|
| 46242 | 15 |
|
| 57040 | 16 |
\let\oldS=\S |
17 |
\def\S{\oldS\,}
|
|
18 |
||
| 43216 | 19 |
\def\qty#1{\ensuremath{\left<\mathit{#1\/}\right>}}
|
20 |
\def\qtybf#1{$\mathbf{\left<\textbf{\textit{#1\/}}\right>}$}
|
|
21 |
||
| 45516 | 22 |
\newcommand\const[1]{\textsf{#1}}
|
23 |
||
| 36926 | 24 |
%\oddsidemargin=4.6mm |
25 |
%\evensidemargin=4.6mm |
|
26 |
%\textwidth=150mm |
|
27 |
%\topmargin=4.6mm |
|
28 |
%\headheight=0mm |
|
29 |
%\headsep=0mm |
|
30 |
%\textheight=234mm |
|
31 |
||
32 |
\def\Colon{\mathord{:\mkern-1.5mu:}}
|
|
33 |
%\def\lbrakk{\mathopen{\lbrack\mkern-3.25mu\lbrack}}
|
|
34 |
%\def\rbrakk{\mathclose{\rbrack\mkern-3.255mu\rbrack}}
|
|
35 |
\def\lparr{\mathopen{(\mkern-4mu\mid}}
|
|
36 |
\def\rparr{\mathclose{\mid\mkern-4mu)}}
|
|
37 |
||
38 |
\def\unk{{?}}
|
|
39 |
\def\undef{(\lambda x.\; \unk)}
|
|
40 |
%\def\unr{\textit{others}}
|
|
41 |
\def\unr{\ldots}
|
|
|
73595
aece5cc9efb7
simplified typesetting of \<guillemotleft>...\<guillemotright>;
wenzelm
parents:
73436
diff
changeset
|
42 |
\def\Abs#1{\hbox{\rm{\guillemetleft}}{\,#1\,}\hbox{\rm{\guillemetright}}}
|
| 36926 | 43 |
\def\Q{{\smash{\lower.2ex\hbox{$\scriptstyle?$}}}}
|
44 |
||
45 |
\urlstyle{tt}
|
|
46 |
||
| 55290 | 47 |
\renewcommand\_{\hbox{\textunderscore\kern-.05ex}}
|
48 |
||
| 72589 | 49 |
\hyphenation{Isa-belle super-posi-tion zipper-posi-tion}
|
50 |
||
| 36926 | 51 |
\begin{document}
|
52 |
||
| 45516 | 53 |
%%% TYPESETTING |
54 |
%\renewcommand\labelitemi{$\bullet$}
|
|
55 |
\renewcommand\labelitemi{\raise.065ex\hbox{\small\textbullet}}
|
|
56 |
||
| 73723 | 57 |
\title{\includegraphics[scale=0.5]{isabelle_logo} \\[4ex]
|
| 36926 | 58 |
Hammering Away \\[\smallskipamount] |
59 |
\Large A User's Guide to Sledgehammer for Isabelle/HOL} |
|
60 |
\author{\hbox{} \\
|
|
|
70818
13d6b561b0ea
added para constrasting 'primrec' and 'fun' -- and removed my middle name
blanchet
parents:
68649
diff
changeset
|
61 |
Jasmin Blanchette \\ |
|
43002
e88fde86e4c2
mention contributions from LCP and explain metis and metisFT encodings
blanchet
parents:
42996
diff
changeset
|
62 |
{\normalsize Institut f\"ur Informatik, Technische Universit\"at M\"unchen} \\[4\smallskipamount]
|
|
e88fde86e4c2
mention contributions from LCP and explain metis and metisFT encodings
blanchet
parents:
42996
diff
changeset
|
63 |
{\normalsize with contributions from} \\[4\smallskipamount]
|
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
64 |
Martin Desharnais \\ |
|
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
65 |
{\normalsize Forschungsinstitut CODE, Universit\"at der Bundeswehr M\"unchen} \\[4\smallskipamount]
|
|
43002
e88fde86e4c2
mention contributions from LCP and explain metis and metisFT encodings
blanchet
parents:
42996
diff
changeset
|
66 |
Lawrence C. Paulson \\ |
|
e88fde86e4c2
mention contributions from LCP and explain metis and metisFT encodings
blanchet
parents:
42996
diff
changeset
|
67 |
{\normalsize Computer Laboratory, University of Cambridge} \\
|
| 36926 | 68 |
\hbox{}}
|
69 |
||
70 |
\maketitle |
|
71 |
||
72 |
\tableofcontents |
|
73 |
||
74 |
\setlength{\parskip}{.7em plus .2em minus .1em}
|
|
75 |
\setlength{\parindent}{0pt}
|
|
76 |
\setlength{\abovedisplayskip}{\parskip}
|
|
77 |
\setlength{\abovedisplayshortskip}{.9\parskip}
|
|
78 |
\setlength{\belowdisplayskip}{\parskip}
|
|
79 |
\setlength{\belowdisplayshortskip}{.9\parskip}
|
|
80 |
||
| 52078 | 81 |
% general-purpose enum environment with correct spacing |
| 36926 | 82 |
\newenvironment{enum}%
|
83 |
{\begin{list}{}{%
|
|
84 |
\setlength{\topsep}{.1\parskip}%
|
|
85 |
\setlength{\partopsep}{.1\parskip}%
|
|
86 |
\setlength{\itemsep}{\parskip}%
|
|
87 |
\advance\itemsep by-\parsep}} |
|
88 |
{\end{list}}
|
|
89 |
||
90 |
\def\pre{\begingroup\vskip0pt plus1ex\advance\leftskip by\leftmargin
|
|
91 |
\advance\rightskip by\leftmargin} |
|
92 |
\def\post{\vskip0pt plus1ex\endgroup}
|
|
93 |
||
94 |
\def\prew{\pre\advance\rightskip by-\leftmargin}
|
|
95 |
\def\postw{\post}
|
|
96 |
||
| 68565 | 97 |
|
| 36926 | 98 |
\section{Introduction}
|
99 |
\label{introduction}
|
|
100 |
||
|
42964
bf45fd2488a2
document primitive support for LEO-II and Satallax
blanchet
parents:
42945
diff
changeset
|
101 |
Sledgehammer is a tool that applies automatic theorem provers (ATPs) |
|
47561
92d88c89efff
update documentation (mostly based on feedback by Makarius)
blanchet
parents:
47530
diff
changeset
|
102 |
and satisfiability-modulo-theories (SMT) solvers on the current goal.% |
|
92d88c89efff
update documentation (mostly based on feedback by Makarius)
blanchet
parents:
47530
diff
changeset
|
103 |
\footnote{The distinction between ATPs and SMT solvers is convenient but mostly
|
| 68565 | 104 |
historical.} |
|
47561
92d88c89efff
update documentation (mostly based on feedback by Makarius)
blanchet
parents:
47530
diff
changeset
|
105 |
% |
|
72403
4a3169d8885c
removed support for obsolete prover SNARK and underperforming prover E-Par
blanchet
parents:
72402
diff
changeset
|
106 |
The supported ATPs include agsyHOL \cite{agsyHOL}, Alt-Ergo \cite{alt-ergo}, E
|
| 72592 | 107 |
\cite{schulz-2019}, iProver \cite{korovin-2009}, LEO-II \cite{leo2}, Leo-III
|
|
72403
4a3169d8885c
removed support for obsolete prover SNARK and underperforming prover E-Par
blanchet
parents:
72402
diff
changeset
|
108 |
\cite{leo3}, Satallax \cite{satallax}, SPASS \cite{weidenbach-et-al-2009},
|
|
4a3169d8885c
removed support for obsolete prover SNARK and underperforming prover E-Par
blanchet
parents:
72402
diff
changeset
|
109 |
Vampire \cite{riazanov-voronkov-2002}, Waldmeister \cite{waldmeister}, and
|
|
4a3169d8885c
removed support for obsolete prover SNARK and underperforming prover E-Par
blanchet
parents:
72402
diff
changeset
|
110 |
Zipperposition \cite{cruanes-2014}. The ATPs are run either locally or remotely
|
|
4a3169d8885c
removed support for obsolete prover SNARK and underperforming prover E-Par
blanchet
parents:
72402
diff
changeset
|
111 |
via the System\-On\-TPTP web service \cite{sutcliffe-2000}. The supported SMT
|
|
75806
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
112 |
solvers are CVC4 \cite{cvc4}, cvc5 \cite{barbosa-et-al-cvc5}, veriT
|
|
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
113 |
\cite{bouton-et-al-2009}, and Z3 \cite{de-moura-2008}. These are always run
|
|
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
114 |
locally. |
| 36926 | 115 |
|
| 57241 | 116 |
The problem passed to the external provers (or solvers) consists of your current |
117 |
goal together with a heuristic selection of hundreds of facts (theorems) from the |
|
| 52078 | 118 |
current theory context, filtered by relevance. |
|
37517
19ba7ec5f1e3
steal some of http://isabelle.in.tum.de/sledgehammer.html and add it to the docs
blanchet
parents:
37498
diff
changeset
|
119 |
|
|
72403
4a3169d8885c
removed support for obsolete prover SNARK and underperforming prover E-Par
blanchet
parents:
72402
diff
changeset
|
120 |
The result of a successful proof search is some source text that typically |
|
4a3169d8885c
removed support for obsolete prover SNARK and underperforming prover E-Par
blanchet
parents:
72402
diff
changeset
|
121 |
reconstructs the proof within Isabelle. For ATPs, the reconstructed proof |
|
4a3169d8885c
removed support for obsolete prover SNARK and underperforming prover E-Par
blanchet
parents:
72402
diff
changeset
|
122 |
typically relies on the general-purpose \textit{metis} proof method, which
|
| 45380 | 123 |
integrates the Metis ATP in Isabelle/HOL with explicit inferences going through |
124 |
the kernel. Thus its results are correct by construction. |
|
| 36926 | 125 |
|
|
53760
cf37f4b84824
moved focus to Isabell/jEdit and away from Proof General
blanchet
parents:
53759
diff
changeset
|
126 |
For Isabelle/jEdit users, Sledgehammer provides an automatic mode that can be |
|
cf37f4b84824
moved focus to Isabell/jEdit and away from Proof General
blanchet
parents:
53759
diff
changeset
|
127 |
enabled via the ``Auto Sledgehammer'' option under ``Plugins > Plugin Options > |
| 54114 | 128 |
Isabelle > General.'' In this mode, a reduced version of Sledgehammer is run on |
129 |
every newly entered theorem for a few seconds. |
|
| 39320 | 130 |
|
| 36926 | 131 |
\newbox\boxA |
| 46298 | 132 |
\setbox\boxA=\hbox{\texttt{NOSPAM}}
|
| 36926 | 133 |
|
| 72589 | 134 |
\newcommand\authoremail{\texttt{jasmin.blan{\color{white}NOSPAM}\kern-\wd\boxA{}chette@\allowbreak
|
| 75021 | 135 |
gmail.\allowbreak com}} |
| 42763 | 136 |
|
| 40689 | 137 |
To run Sledgehammer, you must make sure that the theory \textit{Sledgehammer} is
|
138 |
imported---this is rarely a problem in practice since it is part of |
|
| 72589 | 139 |
\textit{Main}. Examples of Sledgehammer use can be found in the
|
140 |
\texttt{src/HOL/Metis\_Examples} directory. Comments and bug reports
|
|
141 |
concerning Sledgehammer or this manual should be directed to the author at |
|
142 |
\authoremail. |
|
| 36926 | 143 |
|
144 |
||
145 |
\section{Installation}
|
|
146 |
\label{installation}
|
|
147 |
||
| 48387 | 148 |
Sledgehammer is part of Isabelle, so you do not need to install it. However, it |
| 46242 | 149 |
relies on third-party automatic provers (ATPs and SMT solvers). |
| 42763 | 150 |
|
| 74048 | 151 |
Among the ATPs, agsyHOL, Alt-Ergo, E, LEO-II, Leo-III, Satallax, SPASS, Vampire, |
152 |
and Zipperposition can be run locally; in addition, agsyHOL, Alt-Ergo, E, |
|
153 |
iProver, LEO-II, Leo-III, Satallax, Vampire, Waldmeister, and Zipperposition are |
|
154 |
available remotely via System\-On\-TPTP \cite{sutcliffe-2000}. The SMT solvers
|
|
|
75806
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
155 |
CVC4, cvc5, veriT, and Z3 can be run locally. |
| 36926 | 156 |
|
| 46242 | 157 |
There are three main ways to install automatic provers on your machine: |
| 36926 | 158 |
|
| 46242 | 159 |
\begin{sloppy}
|
160 |
\begin{enum}
|
|
161 |
\item[\labelitemi] If you installed an official Isabelle package, it should |
|
|
75806
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
162 |
already include properly set up executables for CVC4, cvc5, E, SPASS, Vampire, |
|
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
163 |
veriT, Z3, and Zipperposition ready to use. |
| 46242 | 164 |
|
| 74048 | 165 |
\item[\labelitemi] Alternatively, you can download the Isabelle-aware CVC4, E, |
| 75021 | 166 |
SPASS, Vampire, veriT, Z3, and Zipperposition binary packages from \download. |
167 |
Extract the archives, then add a line to your |
|
168 |
\texttt{\$ISABELLE\_HOME\_USER\slash etc\slash components}%
|
|
|
41747
f58d4d202924
fix path to etc/settings and etc/components in doc
blanchet
parents:
41740
diff
changeset
|
169 |
\footnote{The variable \texttt{\$ISABELLE\_HOME\_USER} is set by Isabelle at
|
| 46242 | 170 |
startup. Its value can be retrieved by executing \texttt{isabelle}
|
|
41747
f58d4d202924
fix path to etc/settings and etc/components in doc
blanchet
parents:
41740
diff
changeset
|
171 |
\texttt{getenv} \texttt{ISABELLE\_HOME\_USER} on the command line.}
|
| 72592 | 172 |
file with the absolute path to the prover. For example, if the |
173 |
\texttt{components} file does not exist yet and you extracted SPASS to
|
|
174 |
\texttt{/usr/local/spass-3.8ds}, create it with the single line
|
|
| 36926 | 175 |
|
176 |
\prew |
|
| 47577 | 177 |
\texttt{/usr/local/spass-3.8ds}
|
| 36926 | 178 |
\postw |
179 |
||
|
47561
92d88c89efff
update documentation (mostly based on feedback by Makarius)
blanchet
parents:
47530
diff
changeset
|
180 |
in it. |
| 38043 | 181 |
|
| 70937 | 182 |
\item[\labelitemi] If you prefer to build agsyHOL, Alt-Ergo, E, LEO-II, |
| 75021 | 183 |
Leo-III, Satallax, or Zipperposition manually, set the environment variable |
| 52078 | 184 |
\texttt{AGSYHOL\_HOME}, \texttt{E\_HOME}, \texttt{LEO2\_HOME},
|
| 75021 | 185 |
\texttt{LEO3\_HOME}, \texttt{SATALLAX\_HOME}, or \texttt{ZIPPERPOSITION\_HOME}
|
| 68565 | 186 |
to the directory that contains the \texttt{agsyHOL},
|
| 75021 | 187 |
\texttt{eprover} (or \texttt{eprover-ho}),
|
188 |
\texttt{leo}, \texttt{leo3}, \texttt{satallax}, or \texttt{zipperposition}
|
|
189 |
executable; for Alt-Ergo, set the environment variable \texttt{WHY3\_HOME} to the
|
|
|
73970
34c8cf767fa3
adjusted E setup to avoid generating FOOL with 2.5 (where 'ite' is missing)
blanchet
parents:
73941
diff
changeset
|
190 |
directory that contains the \texttt{why3} executable. Ideally, you
|
| 70929 | 191 |
should also set \texttt{E\_VERSION}, \texttt{LEO2\_VERSION},
|
| 75021 | 192 |
\texttt{LEO3\_VERSION}, \texttt{SATALLAX\_VERSION}, or
|
193 |
\texttt{ZIPPERPOSITION\_VERSION} to the prover's version number (e.g., ``3.6'').
|
|
| 36926 | 194 |
|
|
75806
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
195 |
Similarly, if you want to install CVC4, cvc5, veriT, or Z3, set the environment |
|
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
196 |
variable \texttt{CVC4\_\allowbreak SOLVER}, \texttt{CVC5\_\allowbreak SOLVER},
|
|
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
197 |
\texttt{ISABELLE\_\allowbreak VERIT},
|
| 74048 | 198 |
or \texttt{Z3\_SOLVER} to the complete path of the executable, \emph{including
|
|
75806
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
199 |
the file name}. Ideally, also set \texttt{CVC4\_VERSION}, \texttt{CVC5\_VERSION},
|
| 74048 | 200 |
\texttt{VERIT\_VERSION}, or \texttt{Z3\_VERSION} to the solver's version number
|
201 |
(e.g., ``4.4.0''). |
|
| 46242 | 202 |
\end{enum}
|
203 |
\end{sloppy}
|
|
| 36926 | 204 |
|
| 66735 | 205 |
To check whether the provers are successfully installed, try out the example |
206 |
in \S\ref{first-steps}. If the remote versions of any of these provers is used
|
|
207 |
(identified by the prefix ``\textit{remote\_\/}''), or if the local versions
|
|
208 |
fail to solve the easy goal presented there, something must be wrong with the |
|
209 |
installation. |
|
| 46242 | 210 |
|
| 68565 | 211 |
|
| 36926 | 212 |
\section{First Steps}
|
213 |
\label{first-steps}
|
|
214 |
||
215 |
To illustrate Sledgehammer in context, let us start a theory file and |
|
216 |
attempt to prove a simple lemma: |
|
217 |
||
218 |
\prew |
|
219 |
\textbf{theory}~\textit{Scratch} \\
|
|
| 75021 | 220 |
\noindent\hbox{}\quad \textbf{imports}~\textit{Main} \\
|
| 36926 | 221 |
\textbf{begin} \\[2\smallskipamount]
|
222 |
% |
|
| 42945 | 223 |
\textbf{lemma} ``$[a] = [b] \,\Longrightarrow\, a = b$'' \\
|
| 36926 | 224 |
\textbf{sledgehammer}
|
225 |
\postw |
|
226 |
||
|
53760
cf37f4b84824
moved focus to Isabell/jEdit and away from Proof General
blanchet
parents:
53759
diff
changeset
|
227 |
Instead of issuing the \textbf{sledgehammer} command, you can also use the
|
| 72592 | 228 |
Sledgehammer panel in Isabelle/jEdit. Sledgehammer might produce something like |
229 |
the following output after a few seconds: |
|
| 36926 | 230 |
|
231 |
\prew |
|
232 |
\slshape |
|
| 75021 | 233 |
e found a proof\ldots \\ |
234 |
cvc4 found a proof\ldots \\ |
|
235 |
z3 found a proof\ldots \\ |
|
236 |
vampire found a proof\ldots \\ |
|
237 |
e: Try this: \textbf{by} \textit{simp} (0.3 ms) \\
|
|
238 |
cvc4: Try this: \textbf{by} \textit{simp} (0.4 ms) \\
|
|
239 |
z3: Try this: \textbf{by} \textit{simp} (0.5 ms) \\
|
|
240 |
vampire: Try this: \textbf{by} \textit{simp} (0.3 ms) \\
|
|
241 |
QED |
|
| 36926 | 242 |
\postw |
243 |
||
| 75021 | 244 |
Sledgehammer ran CVC4, E, Vampire, Z3, and possibly other provers in parallel. |
245 |
The list may vary depending on which provers are installed and how many |
|
246 |
processor cores are available. |
|
| 36926 | 247 |
|
| 72592 | 248 |
For each successful prover, Sledgehammer gives a one-line Isabelle proof. Rough |
249 |
timings are shown in parentheses, indicating how fast the call is. You can |
|
250 |
click the proof to insert it into the theory text. |
|
| 36926 | 251 |
|
|
51190
2654b3965c8d
made "isar_proofs" a 3-way option, to provide a way to totally disable isar_proofs if desired
blanchet
parents:
51189
diff
changeset
|
252 |
In addition, you can ask Sledgehammer for an Isar text proof by enabling the |
| 49919 | 253 |
\textit{isar\_proofs} option (\S\ref{output-format}):
|
| 36926 | 254 |
|
255 |
\prew |
|
| 49919 | 256 |
\textbf{sledgehammer} [\textit{isar\_proofs}]
|
| 36926 | 257 |
\postw |
258 |
||
259 |
When Isar proof construction is successful, it can yield proofs that are more |
|
| 72592 | 260 |
readable and also faster than \textit{metis} or \textit{smt} one-line
|
261 |
proofs. This feature is experimental. |
|
| 36926 | 262 |
|
| 68565 | 263 |
|
|
37517
19ba7ec5f1e3
steal some of http://isabelle.in.tum.de/sledgehammer.html and add it to the docs
blanchet
parents:
37498
diff
changeset
|
264 |
\section{Hints}
|
|
19ba7ec5f1e3
steal some of http://isabelle.in.tum.de/sledgehammer.html and add it to the docs
blanchet
parents:
37498
diff
changeset
|
265 |
\label{hints}
|
|
19ba7ec5f1e3
steal some of http://isabelle.in.tum.de/sledgehammer.html and add it to the docs
blanchet
parents:
37498
diff
changeset
|
266 |
|
| 42884 | 267 |
This section presents a few hints that should help you get the most out of |
|
46643
a88bccd2b567
added support for Alt-Ergo through Why3 (mostly for experimental purposes, e.g. polymorphism vs. monomorphization)
blanchet
parents:
46640
diff
changeset
|
268 |
Sledgehammer. Frequently asked questions are answered in |
| 45380 | 269 |
\S\ref{frequently-asked-questions}.
|
| 42884 | 270 |
|
| 46242 | 271 |
%\newcommand\point[1]{\medskip\par{\sl\bfseries#1}\par\nopagebreak}
|
| 75021 | 272 |
\newcommand\point[1]{\subsection{\slshape #1}}
|
| 42763 | 273 |
|
| 68565 | 274 |
|
| 42763 | 275 |
\point{Presimplify the goal}
|
276 |
||
|
37517
19ba7ec5f1e3
steal some of http://isabelle.in.tum.de/sledgehammer.html and add it to the docs
blanchet
parents:
37498
diff
changeset
|
277 |
For best results, first simplify your problem by calling \textit{auto} or at
|
| 42945 | 278 |
least \textit{safe} followed by \textit{simp\_all}. The SMT solvers provide
|
279 |
arithmetic decision procedures, but the ATPs typically do not (or if they do, |
|
280 |
Sledgehammer does not use it yet). Apart from Waldmeister, they are not |
|
|
53759
a198ce71de11
took out Waldmeister from list of default provers -- it's usually just visual noise, and its integration in Sledgehammer leaves much to be desired
blanchet
parents:
53757
diff
changeset
|
281 |
particularly good at heavy rewriting, but because they regard equations as |
| 42945 | 282 |
undirected, they often prove theorems that require the reverse orientation of a |
283 |
\textit{simp} rule. Higher-order problems can be tackled, but the success rate
|
|
| 75021 | 284 |
is better for first-order problems. |
|
37517
19ba7ec5f1e3
steal some of http://isabelle.in.tum.de/sledgehammer.html and add it to the docs
blanchet
parents:
37498
diff
changeset
|
285 |
|
| 68565 | 286 |
|
|
53760
cf37f4b84824
moved focus to Isabell/jEdit and away from Proof General
blanchet
parents:
53759
diff
changeset
|
287 |
\point{Familiarize yourself with the main options}
|
| 42763 | 288 |
|
289 |
Sledgehammer's options are fully documented in \S\ref{command-syntax}. Many of
|
|
290 |
the options are very specialized, but serious users of the tool should at least |
|
291 |
familiarize themselves with the following options: |
|
292 |
||
293 |
\begin{enum}
|
|
| 45516 | 294 |
\item[\labelitemi] \textbf{\textit{provers}} (\S\ref{mode-of-operation}) specifies
|
| 42884 | 295 |
the automatic provers (ATPs and SMT solvers) that should be run whenever |
| 75021 | 296 |
Sledgehammer is invoked (e.g., ``\textit{provers}~= \textit{cvc4 e
|
297 |
vampire zipperposition\/}''). |
|
| 42763 | 298 |
|
| 48294 | 299 |
\item[\labelitemi] \textbf{\textit{max\_facts}} (\S\ref{relevance-filter})
|
| 42884 | 300 |
specifies the maximum number of facts that should be passed to the provers. By |
| 48294 | 301 |
default, the value is prover-dependent but varies between about 50 and 1000. If |
302 |
the provers time out, you can try lowering this value to, say, 25 or 50 and see |
|
| 42884 | 303 |
if that helps. |
| 42763 | 304 |
|
| 49919 | 305 |
\item[\labelitemi] \textbf{\textit{isar\_proofs}} (\S\ref{output-format}) specifies
|
| 75021 | 306 |
that Isar proofs should be generated, in addition to one-line proofs. The length |
307 |
of the Isar proofs can be controlled by setting \textit{compress}
|
|
308 |
(\S\ref{output-format}).
|
|
| 43038 | 309 |
|
| 45516 | 310 |
\item[\labelitemi] \textbf{\textit{timeout}} (\S\ref{timeouts}) controls the
|
| 61317 | 311 |
provers' time limit. It is set to 30 seconds by default. |
| 42763 | 312 |
\end{enum}
|
313 |
||
| 42884 | 314 |
Options can be set globally using \textbf{sledgehammer\_params}
|
|
43010
a14cf580a5a5
readded Waldmeister as default to the documentation and other minor changes
blanchet
parents:
43008
diff
changeset
|
315 |
(\S\ref{command-syntax}). The command also prints the list of all available
|
|
a14cf580a5a5
readded Waldmeister as default to the documentation and other minor changes
blanchet
parents:
43008
diff
changeset
|
316 |
options with their current value. Fact selection can be influenced by specifying |
|
a14cf580a5a5
readded Waldmeister as default to the documentation and other minor changes
blanchet
parents:
43008
diff
changeset
|
317 |
``$(\textit{add}{:}~\textit{my\_facts})$'' after the \textbf{sledgehammer} call
|
|
a14cf580a5a5
readded Waldmeister as default to the documentation and other minor changes
blanchet
parents:
43008
diff
changeset
|
318 |
to ensure that certain facts are included, or simply ``$(\textit{my\_facts})$''
|
| 58090 | 319 |
to force Sledgehammer to run only with $\textit{my\_facts}$ (and any facts
|
320 |
chained into the goal). |
|
| 42763 | 321 |
|
| 68565 | 322 |
|
| 42763 | 323 |
\section{Frequently Asked Questions}
|
324 |
\label{frequently-asked-questions}
|
|
325 |
||
| 42945 | 326 |
This sections answers frequently (and infrequently) asked questions about |
| 48387 | 327 |
Sledgehammer. It is a good idea to skim over it now even if you do not have any |
| 75021 | 328 |
questions at this stage. |
| 42945 | 329 |
|
| 68565 | 330 |
|
|
43008
bb212c2ad238
renamed "minimize" to "min" to make Sledgehammer output a little bit more concise
blanchet
parents:
43007
diff
changeset
|
331 |
\point{Which facts are passed to the automatic provers?}
|
| 42883 | 332 |
|
| 75021 | 333 |
Sledgehammer heuristically selects a subset of lemmas from the currently loaded |
334 |
libraries. The component that performs this selection is called \emph{relevance
|
|
335 |
filter} (\S\ref{relevance-filter}).
|
|
| 48387 | 336 |
|
337 |
\begin{enum}
|
|
338 |
\item[\labelitemi] |
|
| 72589 | 339 |
The traditional relevance filter, \emph{MePo}
|
340 |
(\underline{Me}ng--\underline{Pau}lson), assigns a score to every available
|
|
341 |
fact (lemma, theorem, definition, or axiom) based upon how many constants that |
|
|
75019
30a619de7973
use same default for FO and HO provers w.r.t. induction principles, based on evaluation -- this also simplifies the code
blanchet
parents:
75016
diff
changeset
|
342 |
fact shares with the goal. This process iterates to include facts |
| 72589 | 343 |
relevant to those just accepted. The constants are weighted to give unusual |
|
75019
30a619de7973
use same default for FO and HO provers w.r.t. induction principles, based on evaluation -- this also simplifies the code
blanchet
parents:
75016
diff
changeset
|
344 |
ones greater significance. MePo copes best when the goal contains some |
| 72589 | 345 |
unusual constants; if all the constants are common, it is unable to |
346 |
discriminate among the hundreds of facts that are picked up. The filter is also |
|
347 |
memoryless: It has no information about how many times a particular fact has |
|
348 |
been used in a proof, and it cannot learn. |
|
| 48387 | 349 |
|
350 |
\item[\labelitemi] |
|
|
57272
fd539459a112
enabled MaSh by default -- set 'MaSh' to 'none' in Isabelle Plugin Options to disable
blanchet
parents:
57245
diff
changeset
|
351 |
An alternative to MePo is \emph{MaSh} (\underline{Ma}chine Learner for
|
|
fd539459a112
enabled MaSh by default -- set 'MaSh' to 'none' in Isabelle Plugin Options to disable
blanchet
parents:
57245
diff
changeset
|
352 |
\underline{S}ledge\underline{h}ammer). It applies machine learning to the
|
|
fd539459a112
enabled MaSh by default -- set 'MaSh' to 'none' in Isabelle Plugin Options to disable
blanchet
parents:
57245
diff
changeset
|
353 |
problem of finding relevant facts. |
| 48387 | 354 |
|
| 61043 | 355 |
\item[\labelitemi] The \emph{MeSh} filter combines MePo and MaSh. This is
|
356 |
the default. |
|
| 48387 | 357 |
\end{enum}
|
358 |
||
| 42883 | 359 |
The number of facts included in a problem varies from prover to prover, since |
|
43008
bb212c2ad238
renamed "minimize" to "min" to make Sledgehammer output a little bit more concise
blanchet
parents:
43007
diff
changeset
|
360 |
some provers get overwhelmed more easily than others. You can show the number of |
| 42883 | 361 |
facts given using the \textit{verbose} option (\S\ref{output-format}) and the
|
362 |
actual facts using \textit{debug} (\S\ref{output-format}).
|
|
363 |
||
364 |
Sledgehammer is good at finding short proofs combining a handful of existing |
|
365 |
lemmas. If you are looking for longer proofs, you must typically restrict the |
|
| 48294 | 366 |
number of facts, by setting the \textit{max\_facts} option
|
| 43574 | 367 |
(\S\ref{relevance-filter}) to, say, 25 or 50.
|
| 42883 | 368 |
|
| 42996 | 369 |
You can also influence which facts are actually selected in a number of ways. If |
370 |
you simply want to ensure that a fact is included, you can specify it using the |
|
| 75021 | 371 |
syntax ``$(\textit{add}{:}~\textit{my\_facts})$''. For example:
|
| 42996 | 372 |
% |
373 |
\prew |
|
374 |
\textbf{sledgehammer} (\textit{add}: \textit{hd.simps} \textit{tl.simps})
|
|
375 |
\postw |
|
376 |
% |
|
377 |
The specified facts then replace the least relevant facts that would otherwise be |
|
378 |
included; the other selected facts remain the same. |
|
379 |
If you want to steer the selection in a particular direction, you can specify |
|
380 |
the facts via \textbf{using}:
|
|
381 |
% |
|
382 |
\prew |
|
383 |
\textbf{using} \textit{hd.simps} \textit{tl.simps} \\
|
|
384 |
\textbf{sledgehammer}
|
|
385 |
\postw |
|
386 |
% |
|
387 |
The facts are then more likely to be selected than otherwise, and if they are |
|
| 75021 | 388 |
selected at a given iteration of MePo, they also influence which facts are |
389 |
selected at subsequent iterations. |
|
| 42996 | 390 |
|
| 68565 | 391 |
|
| 46300 | 392 |
\point{Why does Metis fail to reconstruct the proof?}
|
393 |
||
394 |
There are many reasons. If Metis runs seemingly forever, that is a sign that the |
|
|
57736
5f37ef22f9af
update documentation after removal of 'min' subcommand
blanchet
parents:
57733
diff
changeset
|
395 |
proof is too difficult for it. Metis's search is complete for first-order logic |
| 68565 | 396 |
with equality, so if the proof was found by a superposition-based ATP such as |
| 75021 | 397 |
E, SPASS, or Vampire, Metis should \emph{eventually} find it---in principle.
|
| 46300 | 398 |
|
399 |
In some rare cases, \textit{metis} fails fairly quickly, and you get the error
|
|
|
57736
5f37ef22f9af
update documentation after removal of 'min' subcommand
blanchet
parents:
57733
diff
changeset
|
400 |
message ``One-line proof reconstruction failed.'' This indicates that |
|
5f37ef22f9af
update documentation after removal of 'min' subcommand
blanchet
parents:
57733
diff
changeset
|
401 |
Sledgehammer determined that the goal is provable, but the proof is, for |
|
5f37ef22f9af
update documentation after removal of 'min' subcommand
blanchet
parents:
57733
diff
changeset
|
402 |
technical reasons, beyond \textit{metis}'s power. You can then try again with
|
|
5f37ef22f9af
update documentation after removal of 'min' subcommand
blanchet
parents:
57733
diff
changeset
|
403 |
the \textit{strict} option (\S\ref{problem-encoding}).
|
| 46300 | 404 |
|
| 68565 | 405 |
|
| 72589 | 406 |
\point{What are the \textit{full\_types}, \textit{no\_types}, and \\
|
| 46298 | 407 |
\textit{mono\_tags} arguments to Metis?}
|
| 42883 | 408 |
|
| 46298 | 409 |
The \textit{metis}~(\textit{full\_types}) proof method
|
410 |
and its cousin \textit{metis}~(\textit{mono\_tags}) are fully typed
|
|
|
53760
cf37f4b84824
moved focus to Isabell/jEdit and away from Proof General
blanchet
parents:
53759
diff
changeset
|
411 |
versions of Metis. Each is somewhat slower than \textit{metis}, but the proof
|
|
43228
2ed2f092e990
obsoleted "metisFT", and added "no_types" version of Metis as fallback to Sledgehammer after noticing how useful it can be
blanchet
parents:
43217
diff
changeset
|
412 |
search is fully typed, and it also includes more powerful rules such as the |
| 45516 | 413 |
axiom ``$x = \const{True} \mathrel{\lor} x = \const{False}$'' for reasoning in
|
| 75021 | 414 |
higher-order positions (e.g., in set comprehensions). The method is tried as a |
| 72592 | 415 |
fallback when \textit{metis} fails, and it is sometimes generated by
|
416 |
Sledgehammer instead of \textit{metis} if the proof obviously requires type
|
|
417 |
information or if \textit{metis} failed when Sledgehammer preplayed the proof.
|
|
| 46298 | 418 |
% |
| 43229 | 419 |
At the other end of the soundness spectrum, \textit{metis} (\textit{no\_types})
|
420 |
uses no type information at all during the proof search, which is more efficient |
|
421 |
but often fails. Calls to \textit{metis} (\textit{no\_types}) are occasionally
|
|
422 |
generated by Sledgehammer. |
|
| 46298 | 423 |
% |
424 |
See the \textit{type\_enc} option (\S\ref{problem-encoding}) for details.
|
|
| 43229 | 425 |
|
| 46298 | 426 |
Incidentally, if you ever see warnings such as |
| 42883 | 427 |
|
428 |
\prew |
|
| 43007 | 429 |
\slshape |
| 63729 | 430 |
Metis: Falling back on ``\textit{metis} (\textit{full\_types})''
|
| 42883 | 431 |
\postw |
432 |
||
| 45380 | 433 |
for a successful \textit{metis} proof, you can advantageously pass the
|
|
43228
2ed2f092e990
obsoleted "metisFT", and added "no_types" version of Metis as fallback to Sledgehammer after noticing how useful it can be
blanchet
parents:
43217
diff
changeset
|
434 |
\textit{full\_types} option to \textit{metis} directly.
|
|
2ed2f092e990
obsoleted "metisFT", and added "no_types" version of Metis as fallback to Sledgehammer after noticing how useful it can be
blanchet
parents:
43217
diff
changeset
|
435 |
|
| 68565 | 436 |
|
|
73932
fd21b4a93043
added opaque_combs and renamed hide_lams to opaque_lifting
desharna
parents:
73859
diff
changeset
|
437 |
\point{And what are the \textit{lifting} and \textit{opaque\_lifting} \\
|
|
fd21b4a93043
added opaque_combs and renamed hide_lams to opaque_lifting
desharna
parents:
73859
diff
changeset
|
438 |
arguments to Metis?} |
| 46298 | 439 |
|
440 |
Orthogonally to the encoding of types, it is important to choose an appropriate |
|
| 72592 | 441 |
translation of $\lambda$-abstractions. Metis supports three translation |
442 |
schemes, in decreasing order of power: Curry combinators (the default), |
|
| 46298 | 443 |
$\lambda$-lifting, and a ``hiding'' scheme that disables all reasoning under |
| 75021 | 444 |
$\lambda$-abstractions. See the \textit{lam\_trans} option
|
| 72592 | 445 |
(\S\ref{problem-encoding}) for details.
|
| 46298 | 446 |
|
| 68565 | 447 |
|
448 |
\point{Are the generated proofs minimal?}
|
|
| 43036 | 449 |
|
| 43054 | 450 |
Automatic provers frequently use many more facts than are necessary. |
| 72592 | 451 |
Sledgehammer includes a proof minimization tool that takes a set of facts returned by |
| 57722 | 452 |
a given prover and repeatedly calls a prover or proof method with subsets of |
453 |
those facts to find a minimal set. Reducing the number of facts typically helps |
|
| 75021 | 454 |
reconstruction and declutters the proof documents. |
| 43036 | 455 |
|
| 68565 | 456 |
|
|
43008
bb212c2ad238
renamed "minimize" to "min" to make Sledgehammer output a little bit more concise
blanchet
parents:
43007
diff
changeset
|
457 |
\point{A strange error occurred---what should I do?}
|
| 42763 | 458 |
|
459 |
Sledgehammer tries to give informative error messages. Please report any strange |
|
| 63729 | 460 |
error to the author at \authoremail. |
| 42763 | 461 |
|
| 68565 | 462 |
|
| 42763 | 463 |
\point{Auto can solve it---why not Sledgehammer?}
|
464 |
||
465 |
Problems can be easy for \textit{auto} and difficult for automatic provers, but
|
|
| 48387 | 466 |
the reverse is also true, so do not be discouraged if your first attempts fail. |
| 39320 | 467 |
Because the system refers to all theorems known to Isabelle, it is particularly |
| 57040 | 468 |
suitable when your goal has a short proof but requires lemmas that you do not |
469 |
know about. |
|
|
37517
19ba7ec5f1e3
steal some of http://isabelle.in.tum.de/sledgehammer.html and add it to the docs
blanchet
parents:
37498
diff
changeset
|
470 |
|
| 68565 | 471 |
|
| 42883 | 472 |
\point{Why are there so many options?}
|
473 |
||
| 72589 | 474 |
Sledgehammer's philosophy is that it should work out of the box, without user |
475 |
guidance. Most of the options are meant to be used by the Sledgehammer |
|
476 |
developers for experiments. |
|
| 42883 | 477 |
|
| 68565 | 478 |
|
| 36926 | 479 |
\section{Command Syntax}
|
480 |
\label{command-syntax}
|
|
481 |
||
| 46242 | 482 |
\subsection{Sledgehammer}
|
| 57040 | 483 |
\label{sledgehammer}
|
| 46242 | 484 |
|
| 36926 | 485 |
Sledgehammer can be invoked at any point when there is an open goal by entering |
486 |
the \textbf{sledgehammer} command in the theory file. Its general syntax is as
|
|
487 |
follows: |
|
488 |
||
489 |
\prew |
|
| 43216 | 490 |
\textbf{sledgehammer} \qty{subcommand}$^?$ \qty{options}$^?$ \qty{facts\_override}$^?$ \qty{num}$^?$
|
| 36926 | 491 |
\postw |
492 |
||
| 43216 | 493 |
In the general syntax, the \qty{subcommand} may be any of the following:
|
| 36926 | 494 |
|
495 |
\begin{enum}
|
|
| 45516 | 496 |
\item[\labelitemi] \textbf{\textit{run} (the default):} Runs Sledgehammer on
|
| 43216 | 497 |
subgoal number \qty{num} (1 by default), with the given options and facts.
|
| 36926 | 498 |
|
| 45516 | 499 |
\item[\labelitemi] \textbf{\textit{supported\_provers}:} Prints the list of
|
| 41724 | 500 |
automatic provers supported by Sledgehammer. See \S\ref{installation} and
|
501 |
\S\ref{mode-of-operation} for more information on how to install automatic
|
|
502 |
provers. |
|
| 36926 | 503 |
|
| 48393 | 504 |
\item[\labelitemi] \textbf{\textit{refresh\_tptp}:} Refreshes the list of remote
|
505 |
ATPs available at System\-On\-TPTP \cite{sutcliffe-2000}.
|
|
506 |
\end{enum}
|
|
507 |
||
| 49365 | 508 |
In addition, the following subcommands provide finer control over machine |
| 48393 | 509 |
learning with MaSh: |
510 |
||
511 |
\begin{enum}
|
|
512 |
\item[\labelitemi] \textbf{\textit{unlearn}:} Resets MaSh, erasing any
|
|
513 |
persistent state. |
|
| 48387 | 514 |
|
| 48393 | 515 |
\item[\labelitemi] \textbf{\textit{learn\_isar}:} Invokes MaSh on the current
|
516 |
theory to process all the available facts, learning from their Isabelle/Isar |
|
517 |
proofs. This happens automatically at Sledgehammer invocations if the |
|
518 |
\textit{learn} option (\S\ref{relevance-filter}) is enabled.
|
|
| 48387 | 519 |
|
|
50484
8ec31bdb9d36
adopt the neutral "prover" terminology for MaSh rather than the ambiguous/wrong ATP terminology (which sometimes excludes SMT solvers)
blanchet
parents:
50459
diff
changeset
|
520 |
\item[\labelitemi] \textbf{\textit{learn\_prover}:} Invokes MaSh on the current
|
|
8ec31bdb9d36
adopt the neutral "prover" terminology for MaSh rather than the ambiguous/wrong ATP terminology (which sometimes excludes SMT solvers)
blanchet
parents:
50459
diff
changeset
|
521 |
theory to process all the available facts, learning from proofs generated by |
|
8ec31bdb9d36
adopt the neutral "prover" terminology for MaSh rather than the ambiguous/wrong ATP terminology (which sometimes excludes SMT solvers)
blanchet
parents:
50459
diff
changeset
|
522 |
automatic provers. The prover to use and its timeout can be set using the |
| 48393 | 523 |
\textit{prover} (\S\ref{mode-of-operation}) and \textit{timeout}
|
| 66735 | 524 |
(\S\ref{timeouts}) options. It is recommended to perform learning using a
|
525 |
first-order ATP (such as E, SPASS, and Vampire) as opposed to a |
|
| 48393 | 526 |
higher-order ATP or an SMT solver. |
527 |
||
528 |
\item[\labelitemi] \textbf{\textit{relearn\_isar}:} Same as \textit{unlearn}
|
|
529 |
followed by \textit{learn\_isar}.
|
|
530 |
||
|
50484
8ec31bdb9d36
adopt the neutral "prover" terminology for MaSh rather than the ambiguous/wrong ATP terminology (which sometimes excludes SMT solvers)
blanchet
parents:
50459
diff
changeset
|
531 |
\item[\labelitemi] \textbf{\textit{relearn\_prover}:} Same as \textit{unlearn}
|
|
8ec31bdb9d36
adopt the neutral "prover" terminology for MaSh rather than the ambiguous/wrong ATP terminology (which sometimes excludes SMT solvers)
blanchet
parents:
50459
diff
changeset
|
532 |
followed by \textit{learn\_prover}.
|
| 36926 | 533 |
\end{enum}
|
534 |
||
| 43216 | 535 |
Sledgehammer's behavior can be influenced by various \qty{options}, which can be
|
536 |
specified in brackets after the \textbf{sledgehammer} command. The
|
|
537 |
\qty{options} are a list of key--value pairs of the form ``[$k_1 = v_1,
|
|
|
50484
8ec31bdb9d36
adopt the neutral "prover" terminology for MaSh rather than the ambiguous/wrong ATP terminology (which sometimes excludes SMT solvers)
blanchet
parents:
50459
diff
changeset
|
538 |
\ldots, k_n = v_n$]''. For Boolean options, ``= \textit{true\/}'' is optional.
|
|
8ec31bdb9d36
adopt the neutral "prover" terminology for MaSh rather than the ambiguous/wrong ATP terminology (which sometimes excludes SMT solvers)
blanchet
parents:
50459
diff
changeset
|
539 |
For example: |
| 36926 | 540 |
|
541 |
\prew |
|
| 49919 | 542 |
\textbf{sledgehammer} [\textit{isar\_proofs}, \,\textit{timeout} = 120]
|
| 36926 | 543 |
\postw |
544 |
||
545 |
Default values can be set using \textbf{sledgehammer\_\allowbreak params}:
|
|
546 |
||
547 |
\prew |
|
| 43216 | 548 |
\textbf{sledgehammer\_params} \qty{options}
|
| 36926 | 549 |
\postw |
550 |
||
551 |
The supported options are described in \S\ref{option-reference}.
|
|
552 |
||
| 43216 | 553 |
The \qty{facts\_override} argument lets you alter the set of facts that go
|
554 |
through the relevance filter. It may be of the form ``(\qty{facts})'', where
|
|
555 |
\qty{facts} is a space-separated list of Isabelle facts (theorems, local
|
|
| 36926 | 556 |
assumptions, etc.), in which case the relevance filter is bypassed and the given |
| 43216 | 557 |
facts are used. It may also be of the form ``(\textit{add}:\ \qty{facts\/_{\mathrm{1}}})'',
|
558 |
``(\textit{del}:\ \qty{facts\/_{\mathrm{2}}})'', or ``(\textit{add}:\ \qty{facts\/_{\mathrm{1}}}\
|
|
559 |
\textit{del}:\ \qty{facts\/_{\mathrm{2}}})'', where the relevance filter is instructed to
|
|
560 |
proceed as usual except that it should consider \qty{facts\/_{\mathrm{1}}}
|
|
561 |
highly relevant and \qty{facts\/_{\mathrm{2}}} fully irrelevant.
|
|
| 36926 | 562 |
|
|
53760
cf37f4b84824
moved focus to Isabell/jEdit and away from Proof General
blanchet
parents:
53759
diff
changeset
|
563 |
If you use Isabelle/jEdit, Sledgehammer also provides an automatic mode that can |
|
cf37f4b84824
moved focus to Isabell/jEdit and away from Proof General
blanchet
parents:
53759
diff
changeset
|
564 |
be enabled via the ``Auto Sledgehammer'' option under ``Plugins > Plugin Options |
|
cf37f4b84824
moved focus to Isabell/jEdit and away from Proof General
blanchet
parents:
53759
diff
changeset
|
565 |
> Isabelle > General.'' For automatic runs, only the first prover set using |
|
75022
e9e27d2e61a1
updated documentation of 'slice' (now 'slices') option
blanchet
parents:
75021
diff
changeset
|
566 |
\textit{provers} (\S\ref{mode-of-operation}) is considered,
|
|
e9e27d2e61a1
updated documentation of 'slice' (now 'slices') option
blanchet
parents:
75021
diff
changeset
|
567 |
\textit{dont\_slice} (\S\ref{timeouts}) is set, fewer facts are
|
| 54114 | 568 |
passed to the prover, \textit{fact\_filter} (\S\ref{relevance-filter}) is set to
|
569 |
\textit{mepo}, \textit{strict} (\S\ref{problem-encoding}) is enabled,
|
|
570 |
\textit{verbose} (\S\ref{output-format}) and \textit{debug}
|
|
|
60306
6b7c64ab8bd2
made Auto Sledgehammer behave more like the real thing
blanchet
parents:
60185
diff
changeset
|
571 |
(\S\ref{output-format}) are disabled, and \textit{timeout} (\S\ref{timeouts}) is
|
| 54114 | 572 |
superseded by the ``Auto Time Limit'' option in jEdit. Sledgehammer's output is |
573 |
also more concise. |
|
| 39320 | 574 |
|
| 68565 | 575 |
|
| 46242 | 576 |
\subsection{Metis}
|
| 57040 | 577 |
\label{metis}
|
| 46242 | 578 |
|
| 43216 | 579 |
The \textit{metis} proof method has the syntax
|
580 |
||
581 |
\prew |
|
| 45518 | 582 |
\textbf{\textit{metis}}~(\qty{options})${}^?$~\qty{facts}${}^?$
|
| 43216 | 583 |
\postw |
584 |
||
| 45518 | 585 |
where \qty{facts} is a list of arbitrary facts and \qty{options} is a
|
586 |
comma-separated list consisting of at most one $\lambda$ translation scheme |
|
587 |
specification with the same semantics as Sledgehammer's \textit{lam\_trans}
|
|
588 |
option (\S\ref{problem-encoding}) and at most one type encoding specification
|
|
589 |
with the same semantics as Sledgehammer's \textit{type\_enc} option
|
|
590 |
(\S\ref{problem-encoding}).
|
|
591 |
% |
|
|
73932
fd21b4a93043
added opaque_combs and renamed hide_lams to opaque_lifting
desharna
parents:
73859
diff
changeset
|
592 |
The supported $\lambda$ translation schemes are \textit{opaque\_lifting},
|
| 46366 | 593 |
\textit{lifting}, and \textit{combs} (the default).
|
| 45518 | 594 |
% |
595 |
All the untyped type encodings listed in \S\ref{problem-encoding} are supported.
|
|
596 |
For convenience, the following aliases are provided: |
|
597 |
\begin{enum}
|
|
| 48393 | 598 |
\item[\labelitemi] \textbf{\textit{full\_types}:} Alias for \textit{poly\_guards\_query}.
|
599 |
\item[\labelitemi] \textbf{\textit{partial\_types}:} Alias for \textit{poly\_args}.
|
|
600 |
\item[\labelitemi] \textbf{\textit{no\_types}:} Alias for \textit{erased}.
|
|
| 45518 | 601 |
\end{enum}
|
| 43216 | 602 |
|
| 68565 | 603 |
|
| 36926 | 604 |
\section{Option Reference}
|
605 |
\label{option-reference}
|
|
606 |
||
| 43014 | 607 |
\def\defl{\{}
|
608 |
\def\defr{\}}
|
|
609 |
||
| 36926 | 610 |
\def\flushitem#1{\item[]\noindent\kern-\leftmargin \textbf{#1}}
|
| 47036 | 611 |
\def\optrueonly#1{\flushitem{\textit{#1} $\bigl[$= \textit{true}$\bigr]$\enskip}\nopagebreak\\[\parskip]}
|
| 43014 | 612 |
\def\optrue#1#2{\flushitem{\textit{#1} $\bigl[$= \qtybf{bool}$\bigr]$\enskip \defl\textit{true}\defr\hfill (neg.: \textit{#2})}\nopagebreak\\[\parskip]}
|
613 |
\def\opfalse#1#2{\flushitem{\textit{#1} $\bigl[$= \qtybf{bool}$\bigr]$\enskip \defl\textit{false}\defr\hfill (neg.: \textit{#2})}\nopagebreak\\[\parskip]}
|
|
614 |
\def\opsmart#1#2{\flushitem{\textit{#1} $\bigl[$= \qtybf{smart\_bool}$\bigr]$\enskip \defl\textit{smart}\defr\hfill (neg.: \textit{#2})}\nopagebreak\\[\parskip]}
|
|
|
46409
d4754183ccce
made option available to users (mostly for experiments)
blanchet
parents:
46366
diff
changeset
|
615 |
\def\opsmartx#1#2{\flushitem{\textit{#1} $\bigl[$= \qtybf{smart\_bool}$\bigr]$\enskip \defl\textit{smart}\defr\\\hbox{}\hfill (neg.: \textit{#2})}\nopagebreak\\[\parskip]}
|
| 36926 | 616 |
\def\opnodefault#1#2{\flushitem{\textit{#1} = \qtybf{#2}} \nopagebreak\\[\parskip]}
|
| 43014 | 617 |
\def\opnodefaultbrk#1#2{\flushitem{$\bigl[$\textit{#1} =$\bigr]$ \qtybf{#2}} \nopagebreak\\[\parskip]}
|
618 |
\def\opdefault#1#2#3{\flushitem{\textit{#1} = \qtybf{#2}\enskip \defl\textit{#3}\defr} \nopagebreak\\[\parskip]}
|
|
| 36926 | 619 |
\def\oparg#1#2#3{\flushitem{\textit{#1} \qtybf{#2} = \qtybf{#3}} \nopagebreak\\[\parskip]}
|
620 |
\def\opargbool#1#2#3{\flushitem{\textit{#1} \qtybf{#2} $\bigl[$= \qtybf{bool}$\bigr]$\hfill (neg.: \textit{#3})}\nopagebreak\\[\parskip]}
|
|
| 43014 | 621 |
\def\opargboolorsmart#1#2#3{\flushitem{\textit{#1} \qtybf{#2} $\bigl[$= \qtybf{smart\_bool}$\bigr]$\hfill (neg.: \textit{#3})}\nopagebreak\\[\parskip]}
|
| 36926 | 622 |
|
623 |
Sledgehammer's options are categorized as follows:\ mode of operation |
|
| 38984 | 624 |
(\S\ref{mode-of-operation}), problem encoding (\S\ref{problem-encoding}),
|
625 |
relevance filter (\S\ref{relevance-filter}), output format
|
|
| 57241 | 626 |
(\S\ref{output-format}), regression testing (\S\ref{regression-testing}),
|
627 |
and timeouts (\S\ref{timeouts}).
|
|
| 36926 | 628 |
|
629 |
The descriptions below refer to the following syntactic quantities: |
|
630 |
||
631 |
\begin{enum}
|
|
| 45516 | 632 |
\item[\labelitemi] \qtybf{string}: A string.
|
633 |
\item[\labelitemi] \qtybf{bool\/}: \textit{true} or \textit{false}.
|
|
634 |
\item[\labelitemi] \qtybf{smart\_bool\/}: \textit{true}, \textit{false}, or
|
|
| 40203 | 635 |
\textit{smart}.
|
| 45516 | 636 |
\item[\labelitemi] \qtybf{int\/}: An integer.
|
|
54816
10d48c2a3e32
made timeouts in Sledgehammer not be 'option's -- simplified lots of code
blanchet
parents:
54788
diff
changeset
|
637 |
\item[\labelitemi] \qtybf{float}: A floating-point number (e.g., 2.5 or 60)
|
|
10d48c2a3e32
made timeouts in Sledgehammer not be 'option's -- simplified lots of code
blanchet
parents:
54788
diff
changeset
|
638 |
expressing a number of seconds. |
| 45516 | 639 |
\item[\labelitemi] \qtybf{float\_pair\/}: A pair of floating-point numbers
|
|
40343
4521d56aef63
use floating-point numbers for Sledgehammer's "thresholds" option rather than percentages;
blanchet
parents:
40341
diff
changeset
|
640 |
(e.g., 0.6 0.95). |
| 45516 | 641 |
\item[\labelitemi] \qtybf{smart\_int\/}: An integer or \textit{smart}.
|
| 36926 | 642 |
\end{enum}
|
643 |
||
| 43217 | 644 |
Default values are indicated in curly brackets (\textrm{\{\}}). Boolean options
|
| 61317 | 645 |
have a negative counterpart (e.g., \textit{minimize} vs.\
|
646 |
\textit{dont\_minimize}). When setting Boolean options or their negative
|
|
| 47963 | 647 |
counterparts, ``= \textit{true\/}'' may be omitted.
|
| 36926 | 648 |
|
| 68565 | 649 |
|
| 36926 | 650 |
\subsection{Mode of Operation}
|
651 |
\label{mode-of-operation}
|
|
652 |
||
653 |
\begin{enum}
|
|
| 43014 | 654 |
\opnodefaultbrk{provers}{string}
|
|
40059
6ad9081665db
use consistent terminology in Sledgehammer: "prover = ATP or SMT solver or ..."
blanchet
parents:
39335
diff
changeset
|
655 |
Specifies the automatic provers to use as a space-separated list (e.g., |
| 68565 | 656 |
``\textit{cvc4}~\textit{e}~\textit{spass}~\textit{vampire\/}'').
|
| 46299 | 657 |
Provers can be run locally or remotely; see \S\ref{installation} for
|
| 75036 | 658 |
installation instructions. By default, \textit{provers} is set to the list of
|
659 |
all installed local provers. |
|
| 46299 | 660 |
|
661 |
The following local provers are supported: |
|
| 36926 | 662 |
|
| 48701 | 663 |
\begin{sloppy}
|
| 36926 | 664 |
\begin{enum}
|
| 70937 | 665 |
\item[\labelitemi] \textbf{\textit{agsyhol}:} agsyHOL is an automatic
|
|
70936
646651bcf261
updated nomenclature for TPTP languages to use modern three-symbol abbreviations (e.g. TF1)
blanchet
parents:
70935
diff
changeset
|
666 |
higher-order prover developed by Fredrik Lindblad \cite{agsyHOL}. To use
|
| 70937 | 667 |
agsyHOL, set the environment variable \texttt{AGSYHOL\_HOME} to the directory
|
|
74045
302994f5a3c2
updated Sledgehammer docs -- removed most version numbers since these are tedious to maintain
blanchet
parents:
74005
diff
changeset
|
668 |
that contains the \texttt{agsyHOL} executable.
|
| 52078 | 669 |
|
|
46643
a88bccd2b567
added support for Alt-Ergo through Why3 (mostly for experimental purposes, e.g. polymorphism vs. monomorphization)
blanchet
parents:
46640
diff
changeset
|
670 |
\item[\labelitemi] \textbf{\textit{alt\_ergo}:} Alt-Ergo is a polymorphic
|
| 52078 | 671 |
ATP developed by Bobot et al.\ \cite{alt-ergo}.
|
|
70936
646651bcf261
updated nomenclature for TPTP languages to use modern three-symbol abbreviations (e.g. TF1)
blanchet
parents:
70935
diff
changeset
|
672 |
It supports the TPTP polymorphic typed first-order format (TF1) via Why3 |
| 53102 | 673 |
\cite{why3}. To use Alt-Ergo, set the environment variable \texttt{WHY3\_HOME}
|
|
56379
d8ecce5d51cd
use Alt-Ergo 0.95.2, the latest and greatest version
blanchet
parents:
56378
diff
changeset
|
674 |
to the directory that contains the \texttt{why3} executable. Sledgehammer
|
|
d8ecce5d51cd
use Alt-Ergo 0.95.2, the latest and greatest version
blanchet
parents:
56378
diff
changeset
|
675 |
requires Alt-Ergo 0.95.2 and Why3 0.83. |
|
46643
a88bccd2b567
added support for Alt-Ergo through Why3 (mostly for experimental purposes, e.g. polymorphism vs. monomorphization)
blanchet
parents:
46640
diff
changeset
|
676 |
|
| 74048 | 677 |
\item[\labelitemi] \textbf{\textit{cvc4}:} CVC4 is an SMT solver developed by
|
|
75806
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
678 |
Barrett et al.\ \cite{cvc4}. To use CVC4,
|
| 74048 | 679 |
set the environment variable \texttt{CVC4\_SOLVER} to the complete path of the
|
680 |
executable, including the file name, or install the prebuilt CVC4 package from |
|
|
74045
302994f5a3c2
updated Sledgehammer docs -- removed most version numbers since these are tedious to maintain
blanchet
parents:
74005
diff
changeset
|
681 |
\download. |
| 57241 | 682 |
|
|
75806
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
683 |
\item[\labelitemi] \textbf{\textit{cvc5}:} cvc5 is an SMT solver developed by
|
|
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
684 |
Barbosa et al.\ \cite{barbosa-et-al-cvc5}. To use cvc5,
|
|
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
685 |
set the environment variable \texttt{CVC5\_SOLVER} to the complete path of the
|
|
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
686 |
executable, including the file name. |
|
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
687 |
|
| 45516 | 688 |
\item[\labelitemi] \textbf{\textit{e}:} E is a first-order resolution prover
|
| 72592 | 689 |
developed by Stephan Schulz \cite{schulz-2019}. To use E, set the environment
|
|
42964
bf45fd2488a2
document primitive support for LEO-II and Satallax
blanchet
parents:
42945
diff
changeset
|
690 |
variable \texttt{E\_HOME} to the directory that contains the \texttt{eproof}
|
| 52757 | 691 |
executable and \texttt{E\_VERSION} to the version number (e.g., ``1.8''), or
|
|
74045
302994f5a3c2
updated Sledgehammer docs -- removed most version numbers since these are tedious to maintain
blanchet
parents:
74005
diff
changeset
|
692 |
install the prebuilt E package from \download. |
| 48652 | 693 |
|
| 48701 | 694 |
\item[\labelitemi] \textbf{\textit{iprover}:} iProver is a pure
|
|
74045
302994f5a3c2
updated Sledgehammer docs -- removed most version numbers since these are tedious to maintain
blanchet
parents:
74005
diff
changeset
|
695 |
instantiation-based prover developed by Konstantin Korovin \cite{korovin-2009}.
|
|
302994f5a3c2
updated Sledgehammer docs -- removed most version numbers since these are tedious to maintain
blanchet
parents:
74005
diff
changeset
|
696 |
To use iProver, set the environment variable \texttt{IPROVER\_HOME} to the
|
|
302994f5a3c2
updated Sledgehammer docs -- removed most version numbers since these are tedious to maintain
blanchet
parents:
74005
diff
changeset
|
697 |
directory that contains the \texttt{iproveropt} executable. iProver depends on
|
|
302994f5a3c2
updated Sledgehammer docs -- removed most version numbers since these are tedious to maintain
blanchet
parents:
74005
diff
changeset
|
698 |
Vampire to clausify problems, so make sure that Vampire is installed as well. |
| 48701 | 699 |
|
| 45516 | 700 |
\item[\labelitemi] \textbf{\textit{leo2}:} LEO-II is an automatic
|
| 44098 | 701 |
higher-order prover developed by Christoph Benzm\"uller et al.\ \cite{leo2},
|
|
70936
646651bcf261
updated nomenclature for TPTP languages to use modern three-symbol abbreviations (e.g. TF1)
blanchet
parents:
70935
diff
changeset
|
702 |
with support for the TPTP typed higher-order syntax (TH0). To use LEO-II, set |
| 46242 | 703 |
the environment variable \texttt{LEO2\_HOME} to the directory that contains the
|
|
74045
302994f5a3c2
updated Sledgehammer docs -- removed most version numbers since these are tedious to maintain
blanchet
parents:
74005
diff
changeset
|
704 |
\texttt{leo} executable.
|
| 44098 | 705 |
|
|
67021
41f1f8c4259b
integrated Leo-III in Sledgehammer (thanks to Alexander Steen for the patch)
blanchet
parents:
66735
diff
changeset
|
706 |
\item[\labelitemi] \textbf{\textit{leo3}:} Leo-III is an automatic
|
| 75021 | 707 |
higher-order prover developed by Alexander Steen, Christoph Benzm\"uller, |
708 |
et al.\ \cite{leo3},
|
|
|
70936
646651bcf261
updated nomenclature for TPTP languages to use modern three-symbol abbreviations (e.g. TF1)
blanchet
parents:
70935
diff
changeset
|
709 |
with support for the TPTP typed higher-order syntax (TH0). To use Leo-III, set |
|
67021
41f1f8c4259b
integrated Leo-III in Sledgehammer (thanks to Alexander Steen for the patch)
blanchet
parents:
66735
diff
changeset
|
710 |
the environment variable \texttt{LEO3\_HOME} to the directory that contains the
|
|
74045
302994f5a3c2
updated Sledgehammer docs -- removed most version numbers since these are tedious to maintain
blanchet
parents:
74005
diff
changeset
|
711 |
\texttt{leo3} executable.
|
|
67021
41f1f8c4259b
integrated Leo-III in Sledgehammer (thanks to Alexander Steen for the patch)
blanchet
parents:
66735
diff
changeset
|
712 |
|
| 45516 | 713 |
\item[\labelitemi] \textbf{\textit{satallax}:} Satallax is an automatic
|
| 44098 | 714 |
higher-order prover developed by Chad Brown et al.\ \cite{satallax}, with
|
|
70936
646651bcf261
updated nomenclature for TPTP languages to use modern three-symbol abbreviations (e.g. TF1)
blanchet
parents:
70935
diff
changeset
|
715 |
support for the TPTP typed higher-order syntax (TH0). To use Satallax, set the |
| 46242 | 716 |
environment variable \texttt{SATALLAX\_HOME} to the directory that contains the
|
|
74045
302994f5a3c2
updated Sledgehammer docs -- removed most version numbers since these are tedious to maintain
blanchet
parents:
74005
diff
changeset
|
717 |
\texttt{satallax} executable.
|
| 44098 | 718 |
|
| 45516 | 719 |
\item[\labelitemi] \textbf{\textit{spass}:} SPASS is a first-order resolution
|
|
42964
bf45fd2488a2
document primitive support for LEO-II and Satallax
blanchet
parents:
42945
diff
changeset
|
720 |
prover developed by Christoph Weidenbach et al.\ \cite{weidenbach-et-al-2009}.
|
|
bf45fd2488a2
document primitive support for LEO-II and Satallax
blanchet
parents:
42945
diff
changeset
|
721 |
To use SPASS, set the environment variable \texttt{SPASS\_HOME} to the directory
|
| 47056 | 722 |
that contains the \texttt{SPASS} executable and \texttt{SPASS\_VERSION} to the
|
| 47577 | 723 |
version number (e.g., ``3.8ds''), or install the prebuilt SPASS package from |
|
74045
302994f5a3c2
updated Sledgehammer docs -- removed most version numbers since these are tedious to maintain
blanchet
parents:
74005
diff
changeset
|
724 |
\download. |
| 36926 | 725 |
|
| 48652 | 726 |
\item[\labelitemi] \textbf{\textit{vampire}:} Vampire is a first-order
|
727 |
resolution prover developed by Andrei Voronkov and his colleagues |
|
|
42964
bf45fd2488a2
document primitive support for LEO-II and Satallax
blanchet
parents:
42945
diff
changeset
|
728 |
\cite{riazanov-voronkov-2002}. To use Vampire, set the environment variable
|
|
bf45fd2488a2
document primitive support for LEO-II and Satallax
blanchet
parents:
42945
diff
changeset
|
729 |
\texttt{VAMPIRE\_HOME} to the directory that contains the \texttt{vampire}
|
| 48006 | 730 |
executable and \texttt{VAMPIRE\_VERSION} to the version number (e.g.,
|
|
74045
302994f5a3c2
updated Sledgehammer docs -- removed most version numbers since these are tedious to maintain
blanchet
parents:
74005
diff
changeset
|
731 |
``4.2.2''). |
| 40942 | 732 |
|
|
59035
3a2153676705
renamed 'veriT' to 'verit', to stick to all-lowercase rule for prover names
blanchet
parents:
59034
diff
changeset
|
733 |
\item[\labelitemi] \textbf{\textit{verit}:} veriT \cite{bouton-et-al-2009} is an
|
| 65516 | 734 |
SMT solver developed by David D\'eharbe, Pascal Fontaine, and their colleagues. |
| 72592 | 735 |
It is designed to produce detailed proofs for reconstruction in proof |
|
74388
d5e034f2c109
fixed veriT environment variable in sledgehammer's documentation
desharna
parents:
74367
diff
changeset
|
736 |
assistants. To use veriT, set the environment variable \texttt{ISABELLE\_VERIT}
|
|
74045
302994f5a3c2
updated Sledgehammer docs -- removed most version numbers since these are tedious to maintain
blanchet
parents:
74005
diff
changeset
|
737 |
to the complete path of the executable, including the file name. |
|
58497
20aaa307c0ff
updated docs with two provers: veriT and Zipperposition
blanchet
parents:
58090
diff
changeset
|
738 |
|
| 45516 | 739 |
\item[\labelitemi] \textbf{\textit{z3}:} Z3 is an SMT solver developed at
|
| 72592 | 740 |
Microsoft Research \cite{de-moura-2008}. To use Z3, set the environment variable
|
| 59961 | 741 |
\texttt{Z3\_SOLVER} to the complete path of the executable, including the
|
|
74045
302994f5a3c2
updated Sledgehammer docs -- removed most version numbers since these are tedious to maintain
blanchet
parents:
74005
diff
changeset
|
742 |
file name. |
| 56378 | 743 |
|
|
58497
20aaa307c0ff
updated docs with two provers: veriT and Zipperposition
blanchet
parents:
58090
diff
changeset
|
744 |
\item[\labelitemi] \textbf{\textit{zipperposition}:} Zipperposition
|
| 72174 | 745 |
\cite{cruanes-2014} is a higher-order superposition prover developed by Simon
|
| 72589 | 746 |
Cruanes, Petar Vukmirovi\'c, and colleagues. To use Zipperposition, set the |
747 |
environment variable \texttt{ZIPPERPOSITION\_HOME} to the directory that
|
|
748 |
contains the \texttt{zipperposition} executable and
|
|
749 |
\texttt{ZIPPERPOSITION\_VERSION} to the version number (e.g., ``2.0.1'').
|
|
| 57536 | 750 |
\end{enum}
|
| 56378 | 751 |
|
| 48701 | 752 |
\end{sloppy}
|
| 42945 | 753 |
|
| 57536 | 754 |
Moreover, the following remote provers are supported: |
| 42945 | 755 |
|
756 |
\begin{enum}
|
|
| 52078 | 757 |
\item[\labelitemi] \textbf{\textit{remote\_agsyhol}:} The remote version of
|
| 70937 | 758 |
agsyHOL runs on Geoff Sutcliffe's Miami servers \cite{sutcliffe-2000}.
|
759 |
||
760 |
\item[\labelitemi] \textbf{\textit{remote\_alt\_ergo}:} The remote version of
|
|
761 |
Alt-Ergo runs on Geoff Sutcliffe's Miami servers \cite{sutcliffe-2000}.
|
|
| 52078 | 762 |
|
| 45516 | 763 |
\item[\labelitemi] \textbf{\textit{remote\_e}:} The remote version of E runs
|
| 36926 | 764 |
on Geoff Sutcliffe's Miami servers \cite{sutcliffe-2000}.
|
765 |
||
| 48701 | 766 |
\item[\labelitemi] \textbf{\textit{remote\_iprover}:} The
|
| 45339 | 767 |
remote version of iProver runs on Geoff Sutcliffe's Miami servers |
768 |
\cite{sutcliffe-2000}.
|
|
769 |
||
| 45516 | 770 |
\item[\labelitemi] \textbf{\textit{remote\_leo2}:} The remote version of LEO-II
|
| 44098 | 771 |
runs on Geoff Sutcliffe's Miami servers \cite{sutcliffe-2000}.
|
|
42964
bf45fd2488a2
document primitive support for LEO-II and Satallax
blanchet
parents:
42945
diff
changeset
|
772 |
|
|
67021
41f1f8c4259b
integrated Leo-III in Sledgehammer (thanks to Alexander Steen for the patch)
blanchet
parents:
66735
diff
changeset
|
773 |
\item[\labelitemi] \textbf{\textit{remote\_leo3}:} The remote version of Leo-III
|
|
41f1f8c4259b
integrated Leo-III in Sledgehammer (thanks to Alexander Steen for the patch)
blanchet
parents:
66735
diff
changeset
|
774 |
runs on Geoff Sutcliffe's Miami servers \cite{sutcliffe-2000}.
|
|
41f1f8c4259b
integrated Leo-III in Sledgehammer (thanks to Alexander Steen for the patch)
blanchet
parents:
66735
diff
changeset
|
775 |
|
| 45516 | 776 |
\item[\labelitemi] \textbf{\textit{remote\_waldmeister}:} Waldmeister is a unit
|
| 42945 | 777 |
equality prover developed by Hillenbrand et al.\ \cite{waldmeister}. It can be
|
| 43625 | 778 |
used to prove universally quantified equations using unconditional equations, |
779 |
corresponding to the TPTP CNF UEQ division. The remote version of Waldmeister |
|
780 |
runs on Geoff Sutcliffe's Miami servers. |
|
|
70940
ce3a05ad07b7
added support for Zipperposition on SystemOnTPTP
blanchet
parents:
70938
diff
changeset
|
781 |
|
|
ce3a05ad07b7
added support for Zipperposition on SystemOnTPTP
blanchet
parents:
70938
diff
changeset
|
782 |
\item[\labelitemi] \textbf{\textit{remote\_zipperposition}:} The remote
|
|
ce3a05ad07b7
added support for Zipperposition on SystemOnTPTP
blanchet
parents:
70938
diff
changeset
|
783 |
version of Zipperposition runs on Geoff Sutcliffe's Miami servers. |
| 36926 | 784 |
\end{enum}
|
785 |
||
|
75806
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
786 |
By default, Sledgehammer runs a subset of CVC4, E, SPASS, Vampire, veriT, Z3, |
|
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
787 |
and Zipperposition in parallel, either locally or remotely---depending on the |
|
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
788 |
number of processor cores available and on which provers are actually installed. |
|
2b106aae897c
added support for cvc5 (whose interface is almost identical to CVC4)
blanchet
parents:
75387
diff
changeset
|
789 |
It is generally beneficial to run several provers in parallel. |
|
40059
6ad9081665db
use consistent terminology in Sledgehammer: "prover = ATP or SMT solver or ..."
blanchet
parents:
39335
diff
changeset
|
790 |
|
|
6ad9081665db
use consistent terminology in Sledgehammer: "prover = ATP or SMT solver or ..."
blanchet
parents:
39335
diff
changeset
|
791 |
\opnodefault{prover}{string}
|
|
6ad9081665db
use consistent terminology in Sledgehammer: "prover = ATP or SMT solver or ..."
blanchet
parents:
39335
diff
changeset
|
792 |
Alias for \textit{provers}.
|
|
6ad9081665db
use consistent terminology in Sledgehammer: "prover = ATP or SMT solver or ..."
blanchet
parents:
39335
diff
changeset
|
793 |
|
| 57722 | 794 |
\optrue{minimize}{dont\_minimize}
|
| 72592 | 795 |
Specifies whether the proof minimization tool should be invoked automatically |
796 |
after proof search. |
|
|
45708
7c8bed80301f
updated Sledgehammer docs with new/renamed options
blanchet
parents:
45555
diff
changeset
|
797 |
|
|
7c8bed80301f
updated Sledgehammer docs with new/renamed options
blanchet
parents:
45555
diff
changeset
|
798 |
\nopagebreak |
| 47036 | 799 |
{\small See also \textit{preplay\_timeout} (\S\ref{timeouts})
|
800 |
and \textit{dont\_preplay} (\S\ref{timeouts}).}
|
|
|
45708
7c8bed80301f
updated Sledgehammer docs with new/renamed options
blanchet
parents:
45555
diff
changeset
|
801 |
|
| 53801 | 802 |
\opfalse{spy}{dont\_spy}
|
803 |
Specifies whether Sledgehammer should record statistics in |
|
804 |
\texttt{\$ISA\-BELLE\_\allowbreak HOME\_\allowbreak USER/\allowbreak spy\_\allowbreak sledgehammer}.
|
|
805 |
These statistics can be useful to the developers of Sledgehammer. If you are willing to have your |
|
806 |
interactions recorded in the name of science, please enable this feature and send the statistics |
|
807 |
file every now and then to the author of this manual (\authoremail). |
|
808 |
To change the default value of this option globally, set the environment variable |
|
|
57107
2d502370ee99
changed MaSh to use SML version instead of Python version of naive Bayes by default (i.e. if MASH=yes in the settings, or 'fact_filter=mash' with no other explicit setting)
blanchet
parents:
57095
diff
changeset
|
809 |
\texttt{SLEDGEHAMMER\_SPY} to \textit{yes}.
|
| 53801 | 810 |
|
811 |
\nopagebreak |
|
812 |
{\small See also \textit{debug} (\S\ref{output-format}).}
|
|
813 |
||
| 36926 | 814 |
\opfalse{overlord}{no\_overlord}
|
815 |
Specifies whether Sledgehammer should put its temporary files in |
|
816 |
\texttt{\$ISA\-BELLE\_\allowbreak HOME\_\allowbreak USER}, which is useful for
|
|
817 |
debugging Sledgehammer but also unsafe if several instances of the tool are run |
|
|
48390
4147f2bc4442
add versioning to MaSh state + cleanup dead code
blanchet
parents:
48388
diff
changeset
|
818 |
simultaneously. The files are identified by the prefixes \texttt{prob\_} and
|
|
4147f2bc4442
add versioning to MaSh state + cleanup dead code
blanchet
parents:
48388
diff
changeset
|
819 |
\texttt{mash\_}; you may safely remove them after Sledgehammer has run.
|
| 36926 | 820 |
|
| 54139 | 821 |
\textbf{Warning:} This option is not thread-safe. Use at your own risk.
|
822 |
||
| 36926 | 823 |
\nopagebreak |
824 |
{\small See also \textit{debug} (\S\ref{output-format}).}
|
|
825 |
\end{enum}
|
|
826 |
||
| 68565 | 827 |
|
| 48387 | 828 |
\subsection{Relevance Filter}
|
829 |
\label{relevance-filter}
|
|
830 |
||
831 |
\begin{enum}
|
|
| 48388 | 832 |
\opdefault{fact\_filter}{string}{smart}
|
833 |
Specifies the relevance filter to use. The following filters are available: |
|
834 |
||
835 |
\begin{enum}
|
|
836 |
\item[\labelitemi] \textbf{\textit{mepo}:}
|
|
837 |
The traditional memoryless MePo relevance filter. |
|
838 |
||
839 |
\item[\labelitemi] \textbf{\textit{mash}:}
|
|
| 57532 | 840 |
The MaSh machine learner. Three learning algorithms are provided: |
| 57019 | 841 |
|
842 |
\begin{enum}
|
|
| 57463 | 843 |
\item[\labelitemi] \textbf{\textit{nb}} is an implementation of naive Bayes.
|
| 57019 | 844 |
|
| 57463 | 845 |
\item[\labelitemi] \textbf{\textit{knn}} is an implementation of $k$-nearest
|
846 |
neighbors. |
|
847 |
||
|
57659
b246943b3aa3
reenabled MaSh for Isabelle2014 release (hopefully)
blanchet
parents:
57636
diff
changeset
|
848 |
\item[\labelitemi] \textbf{\textit{nb\_knn}} (also called \textbf{\textit{yes}}
|
|
b246943b3aa3
reenabled MaSh for Isabelle2014 release (hopefully)
blanchet
parents:
57636
diff
changeset
|
849 |
and \textbf{\textit{sml}}) is a combination of naive Bayes and $k$-nearest
|
|
b246943b3aa3
reenabled MaSh for Isabelle2014 release (hopefully)
blanchet
parents:
57636
diff
changeset
|
850 |
neighbors. |
| 57019 | 851 |
\end{enum}
|
852 |
||
|
57272
fd539459a112
enabled MaSh by default -- set 'MaSh' to 'none' in Isabelle Plugin Options to disable
blanchet
parents:
57245
diff
changeset
|
853 |
In addition, the special value \textit{none} is used to disable machine learning by
|
|
fd539459a112
enabled MaSh by default -- set 'MaSh' to 'none' in Isabelle Plugin Options to disable
blanchet
parents:
57245
diff
changeset
|
854 |
default (cf.\ \textit{smart} below).
|
|
fd539459a112
enabled MaSh by default -- set 'MaSh' to 'none' in Isabelle Plugin Options to disable
blanchet
parents:
57245
diff
changeset
|
855 |
|
|
57659
b246943b3aa3
reenabled MaSh for Isabelle2014 release (hopefully)
blanchet
parents:
57636
diff
changeset
|
856 |
The default algorithm is \textit{nb\_knn}. The algorithm can be selected by
|
| 61043 | 857 |
setting the ``MaSh'' option under ``Plugins > Plugin Options > Isabelle > |
| 57532 | 858 |
General'' in Isabelle/jEdit. Persistent data for all three algorithms is stored in |
859 |
the directory \texttt{\$ISABELLE\_\allowbreak HOME\_\allowbreak USER/\allowbreak
|
|
860 |
mash}. |
|
| 48388 | 861 |
|
|
51024
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
50929
diff
changeset
|
862 |
\item[\labelitemi] \textbf{\textit{mesh}:} The MeSh filter, which combines the
|
|
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
50929
diff
changeset
|
863 |
rankings from MePo and MaSh. |
| 48388 | 864 |
|
|
57659
b246943b3aa3
reenabled MaSh for Isabelle2014 release (hopefully)
blanchet
parents:
57636
diff
changeset
|
865 |
\item[\labelitemi] \textbf{\textit{smart}:} A combination of MePo, MaSh, and
|
|
b246943b3aa3
reenabled MaSh for Isabelle2014 release (hopefully)
blanchet
parents:
57636
diff
changeset
|
866 |
MeSh. If the learning algorithm is set to be \textit{none}, \textit{smart}
|
|
b246943b3aa3
reenabled MaSh for Isabelle2014 release (hopefully)
blanchet
parents:
57636
diff
changeset
|
867 |
behaves like MePo. |
| 48388 | 868 |
\end{enum}
|
869 |
||
| 48387 | 870 |
\opdefault{max\_facts}{smart\_int}{smart}
|
871 |
Specifies the maximum number of facts that may be returned by the relevance |
|
|
55297
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
872 |
filter. If the option is set to \textit{smart} (the default), it effectively
|
|
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
873 |
takes a value that was empirically found to be appropriate for the prover. |
|
57107
2d502370ee99
changed MaSh to use SML version instead of Python version of naive Bayes by default (i.e. if MASH=yes in the settings, or 'fact_filter=mash' with no other explicit setting)
blanchet
parents:
57095
diff
changeset
|
874 |
Typical values lie between 50 and 1000. |
|
53757
8d1a059ebcdb
reduce the number of emitted MaSh commands (among others to facilitate debugging)
blanchet
parents:
53518
diff
changeset
|
875 |
|
| 48387 | 876 |
\opdefault{fact\_thresholds}{float\_pair}{\upshape 0.45~0.85}
|
877 |
Specifies the thresholds above which facts are considered relevant by the |
|
878 |
relevance filter. The first threshold is used for the first iteration of the |
|
879 |
relevance filter and the second threshold is used for the last iteration (if it |
|
880 |
is reached). The effective threshold is quadratically interpolated for the other |
|
881 |
iterations. Each threshold ranges from 0 to 1, where 0 means that all theorems |
|
882 |
are relevant and 1 only theorems that refer to previously seen constants. |
|
883 |
||
| 48388 | 884 |
\optrue{learn}{dont\_learn}
|
| 72592 | 885 |
Specifies whether Sledgehammer invocations should run MaSh to learn the |
|
53760
cf37f4b84824
moved focus to Isabell/jEdit and away from Proof General
blanchet
parents:
53759
diff
changeset
|
886 |
available theories (and hence provide more accurate results). Learning takes |
|
cf37f4b84824
moved focus to Isabell/jEdit and away from Proof General
blanchet
parents:
53759
diff
changeset
|
887 |
place only if MaSh is enabled. |
| 48388 | 888 |
|
| 48387 | 889 |
\opdefault{max\_new\_mono\_instances}{int}{smart}
|
890 |
Specifies the maximum number of monomorphic instances to generate beyond |
|
891 |
\textit{max\_facts}. The higher this limit is, the more monomorphic instances
|
|
892 |
are potentially generated. Whether monomorphization takes place depends on the |
|
|
55297
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
893 |
type encoding used. If the option is set to \textit{smart} (the default), it
|
|
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
894 |
takes a value that was empirically found to be appropriate for the prover. For |
|
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
895 |
most provers, this value is 100. |
| 48387 | 896 |
|
897 |
\nopagebreak |
|
898 |
{\small See also \textit{type\_enc} (\S\ref{problem-encoding}).}
|
|
899 |
||
900 |
\opdefault{max\_mono\_iters}{int}{smart}
|
|
901 |
Specifies the maximum number of iterations for the monomorphization fixpoint |
|
902 |
construction. The higher this limit is, the more monomorphic instances are |
|
903 |
potentially generated. Whether monomorphization takes place depends on the |
|
|
55297
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
904 |
type encoding used. If the option is set to \textit{smart} (the default), it
|
|
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
905 |
takes a value that was empirically found to be appropriate for the prover. |
|
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
906 |
For most provers, this value is 3. |
| 48387 | 907 |
|
908 |
\nopagebreak |
|
909 |
{\small See also \textit{type\_enc} (\S\ref{problem-encoding}).}
|
|
|
73941
bec00c7ef8dd
documented Sledgehammer option "induction_rules"
desharna
parents:
73935
diff
changeset
|
910 |
|
|
75019
30a619de7973
use same default for FO and HO provers w.r.t. induction principles, based on evaluation -- this also simplifies the code
blanchet
parents:
75016
diff
changeset
|
911 |
\opdefault{induction\_rules}{string}{exclude}
|
|
73941
bec00c7ef8dd
documented Sledgehammer option "induction_rules"
desharna
parents:
73935
diff
changeset
|
912 |
Specifies whether induction rules should be considered as relevant facts. |
|
bec00c7ef8dd
documented Sledgehammer option "induction_rules"
desharna
parents:
73935
diff
changeset
|
913 |
The following behaviors are available: |
|
bec00c7ef8dd
documented Sledgehammer option "induction_rules"
desharna
parents:
73935
diff
changeset
|
914 |
\begin{enum}
|
|
bec00c7ef8dd
documented Sledgehammer option "induction_rules"
desharna
parents:
73935
diff
changeset
|
915 |
\item[\labelitemi] \textbf{\textit{exclude}:}
|
|
bec00c7ef8dd
documented Sledgehammer option "induction_rules"
desharna
parents:
73935
diff
changeset
|
916 |
Induction rules are ignored by the relevance filter. |
|
bec00c7ef8dd
documented Sledgehammer option "induction_rules"
desharna
parents:
73935
diff
changeset
|
917 |
|
|
74957
089eeaaee525
proper documentation for induction_rules Sledgehammer option
desharna
parents:
74388
diff
changeset
|
918 |
\item[\labelitemi] \textbf{\textit{instantiate}:}
|
|
75019
30a619de7973
use same default for FO and HO provers w.r.t. induction principles, based on evaluation -- this also simplifies the code
blanchet
parents:
75016
diff
changeset
|
919 |
Induction rules are instantiated based on the goal and then |
|
73941
bec00c7ef8dd
documented Sledgehammer option "induction_rules"
desharna
parents:
73935
diff
changeset
|
920 |
considered by the relevance filter. |
|
bec00c7ef8dd
documented Sledgehammer option "induction_rules"
desharna
parents:
73935
diff
changeset
|
921 |
|
|
75019
30a619de7973
use same default for FO and HO provers w.r.t. induction principles, based on evaluation -- this also simplifies the code
blanchet
parents:
75016
diff
changeset
|
922 |
\item[\labelitemi] \textbf{\textit{include}:}
|
|
30a619de7973
use same default for FO and HO provers w.r.t. induction principles, based on evaluation -- this also simplifies the code
blanchet
parents:
75016
diff
changeset
|
923 |
Induction rules are considered by the relevance filter. |
|
73941
bec00c7ef8dd
documented Sledgehammer option "induction_rules"
desharna
parents:
73935
diff
changeset
|
924 |
\end{enum}
|
| 48387 | 925 |
\end{enum}
|
926 |
||
| 68565 | 927 |
|
| 36926 | 928 |
\subsection{Problem Encoding}
|
929 |
\label{problem-encoding}
|
|
930 |
||
| 45516 | 931 |
\newcommand\comb[1]{\const{#1}}
|
932 |
||
| 36926 | 933 |
\begin{enum}
|
| 45516 | 934 |
\opdefault{lam\_trans}{string}{smart}
|
935 |
Specifies the $\lambda$ translation scheme to use in ATP problems. The supported |
|
936 |
translation schemes are listed below: |
|
937 |
||
938 |
\begin{enum}
|
|
| 46366 | 939 |
\item[\labelitemi] \textbf{\textit{lifting}:} Introduce a new
|
| 45516 | 940 |
supercombinator \const{c} for each cluster of $n$~$\lambda$-abstractions,
|
941 |
defined using an equation $\const{c}~x_1~\ldots~x_n = t$ ($\lambda$-lifting).
|
|
942 |
||
|
73935
269b2f976100
added documentation for changes to Sledgehammer option "lam_trans"
desharna
parents:
73932
diff
changeset
|
943 |
\item[\labelitemi] \textbf{\textit{opaque\_lifting}:} Same as
|
|
73941
bec00c7ef8dd
documented Sledgehammer option "induction_rules"
desharna
parents:
73935
diff
changeset
|
944 |
\textit{lifting}, except that the supercombinators are kept opaque,
|
|
bec00c7ef8dd
documented Sledgehammer option "induction_rules"
desharna
parents:
73935
diff
changeset
|
945 |
i.e., they are unspecified fresh constants. This effectively disables |
|
bec00c7ef8dd
documented Sledgehammer option "induction_rules"
desharna
parents:
73935
diff
changeset
|
946 |
all reasoning under $\lambda$-abstractions. |
|
73935
269b2f976100
added documentation for changes to Sledgehammer option "lam_trans"
desharna
parents:
73932
diff
changeset
|
947 |
|
| 46366 | 948 |
\item[\labelitemi] \textbf{\textit{combs}:} Rewrite lambdas to the Curry
|
| 45516 | 949 |
combinators (\comb{I}, \comb{K}, \comb{S}, \comb{B}, \comb{C}). Combinators
|
950 |
enable the ATPs to synthesize $\lambda$-terms but tend to yield bulkier formulas |
|
951 |
than $\lambda$-lifting: The translation is quadratic in the worst case, and the |
|
952 |
equational definitions of the combinators are very prolific in the context of |
|
953 |
resolution. |
|
954 |
||
|
73935
269b2f976100
added documentation for changes to Sledgehammer option "lam_trans"
desharna
parents:
73932
diff
changeset
|
955 |
\item[\labelitemi] \textbf{\textit{opaque\_combs}:} Same as
|
|
73941
bec00c7ef8dd
documented Sledgehammer option "induction_rules"
desharna
parents:
73935
diff
changeset
|
956 |
\textit{combs}, except that the combinators are kept opaque, i.e., without
|
|
bec00c7ef8dd
documented Sledgehammer option "induction_rules"
desharna
parents:
73935
diff
changeset
|
957 |
equational definitions. |
|
73935
269b2f976100
added documentation for changes to Sledgehammer option "lam_trans"
desharna
parents:
73932
diff
changeset
|
958 |
|
| 46366 | 959 |
\item[\labelitemi] \textbf{\textit{combs\_and\_lifting}:} Introduce a new
|
| 45516 | 960 |
supercombinator \const{c} for each cluster of $\lambda$-abstractions and characterize it both using a
|
961 |
lifted equation $\const{c}~x_1~\ldots~x_n = t$ and via Curry combinators.
|
|
962 |
||
| 46366 | 963 |
\item[\labelitemi] \textbf{\textit{combs\_or\_lifting}:} For each cluster of
|
964 |
$\lambda$-abstractions, heuristically choose between $\lambda$-lifting and Curry |
|
965 |
combinators. |
|
966 |
||
| 45516 | 967 |
\item[\labelitemi] \textbf{\textit{keep\_lams}:}
|
968 |
Keep the $\lambda$-abstractions in the generated problems. This is available |
|
|
73859
bc263f1f68cd
added support for TFX's and THF's $ite to Sledgehammer
desharna
parents:
73858
diff
changeset
|
969 |
only with provers that support $\lambda$s. |
| 45516 | 970 |
|
971 |
\item[\labelitemi] \textbf{\textit{smart}:} The actual translation scheme used
|
|
972 |
depends on the ATP and should be the most efficient scheme for that ATP. |
|
973 |
\end{enum}
|
|
974 |
||
| 46366 | 975 |
For SMT solvers, the $\lambda$ translation scheme is always \textit{lifting},
|
976 |
irrespective of the value of this option. |
|
| 45516 | 977 |
|
|
46409
d4754183ccce
made option available to users (mostly for experiments)
blanchet
parents:
46366
diff
changeset
|
978 |
\opsmartx{uncurried\_aliases}{no\_uncurried\_aliases}
|
| 46411 | 979 |
Specifies whether fresh function symbols should be generated as aliases for |
980 |
applications of curried functions in ATP problems. |
|
|
46409
d4754183ccce
made option available to users (mostly for experiments)
blanchet
parents:
46366
diff
changeset
|
981 |
|
|
43627
ecd4bb7a8bc0
update documentation after "type_enc" renaming + fixed a few other out-of-date factlets
blanchet
parents:
43625
diff
changeset
|
982 |
\opdefault{type\_enc}{string}{smart}
|
|
ecd4bb7a8bc0
update documentation after "type_enc" renaming + fixed a few other out-of-date factlets
blanchet
parents:
43625
diff
changeset
|
983 |
Specifies the type encoding to use in ATP problems. Some of the type encodings |
|
ecd4bb7a8bc0
update documentation after "type_enc" renaming + fixed a few other out-of-date factlets
blanchet
parents:
43625
diff
changeset
|
984 |
are unsound, meaning that they can give rise to spurious proofs |
| 48093 | 985 |
(unreconstructible using \textit{metis}). The type encodings are
|
| 46300 | 986 |
listed below, with an indication of their soundness in parentheses. |
| 48093 | 987 |
An asterisk (*) indicates that the encoding is slightly incomplete for |
|
56120
04c37dfef684
updated Sledgehammer docs w.r.t. 'smt2' and 'z3_new'
blanchet
parents:
56119
diff
changeset
|
988 |
reconstruction with \textit{metis}, unless the \textit{strict} option (described
|
| 46302 | 989 |
below) is enabled. |
| 42228 | 990 |
|
991 |
\begin{enum}
|
|
| 48090 | 992 |
\item[\labelitemi] \textbf{\textit{erased} (unsound):} No type information is
|
| 46300 | 993 |
supplied to the ATP, not even to resolve overloading. Types are simply erased. |
| 42582 | 994 |
|
| 45516 | 995 |
\item[\labelitemi] \textbf{\textit{poly\_guards} (sound):} Types are encoded using
|
| 46300 | 996 |
a predicate \const{g}$(\tau, t)$ that guards bound
|
| 48090 | 997 |
variables. Constants are annotated with their types, supplied as extra |
|
42887
771be1dcfef6
document new type system and soundness properties of the different systems
blanchet
parents:
42884
diff
changeset
|
998 |
arguments, to resolve overloading. |
| 42685 | 999 |
|
| 45516 | 1000 |
\item[\labelitemi] \textbf{\textit{poly\_tags} (sound):} Each term and subterm is
|
| 46300 | 1001 |
tagged with its type using a function $\const{t\/}(\tau, t)$.
|
|
42887
771be1dcfef6
document new type system and soundness properties of the different systems
blanchet
parents:
42884
diff
changeset
|
1002 |
|
| 45516 | 1003 |
\item[\labelitemi] \textbf{\textit{poly\_args} (unsound):}
|
| 43990 | 1004 |
Like for \textit{poly\_guards}, constants are annotated with their types to
|
|
43002
e88fde86e4c2
mention contributions from LCP and explain metis and metisFT encodings
blanchet
parents:
42996
diff
changeset
|
1005 |
resolve overloading, but otherwise no type information is encoded. This |
| 57040 | 1006 |
is the default encoding used by the \textit{metis} proof method.
|
| 42685 | 1007 |
|
| 45516 | 1008 |
\item[\labelitemi] |
| 42722 | 1009 |
\textbf{%
|
|
44494
a77901b3774e
rationalized option names -- mono becomes raw_mono and mangled becomes mono
blanchet
parents:
44423
diff
changeset
|
1010 |
\textit{raw\_mono\_guards}, \textit{raw\_mono\_tags} (sound); \\
|
|
a77901b3774e
rationalized option names -- mono becomes raw_mono and mangled becomes mono
blanchet
parents:
44423
diff
changeset
|
1011 |
\textit{raw\_mono\_args} (unsound):} \\
|
| 43990 | 1012 |
Similar to \textit{poly\_guards}, \textit{poly\_tags}, and \textit{poly\_args},
|
| 42722 | 1013 |
respectively, but the problem is additionally monomorphized, meaning that type |
1014 |
variables are instantiated with heuristically chosen ground types. |
|
1015 |
Monomorphization can simplify reasoning but also leads to larger fact bases, |
|
1016 |
which can slow down the ATPs. |
|
| 42582 | 1017 |
|
| 45516 | 1018 |
\item[\labelitemi] |
| 42722 | 1019 |
\textbf{%
|
|
44494
a77901b3774e
rationalized option names -- mono becomes raw_mono and mangled becomes mono
blanchet
parents:
44423
diff
changeset
|
1020 |
\textit{mono\_guards}, \textit{mono\_tags} (sound);
|
| 72589 | 1021 |
\textit{mono\_args} \\ (unsound):} \\
|
| 42722 | 1022 |
Similar to |
|
44494
a77901b3774e
rationalized option names -- mono becomes raw_mono and mangled becomes mono
blanchet
parents:
44423
diff
changeset
|
1023 |
\textit{raw\_mono\_guards}, \textit{raw\_mono\_tags}, and
|
| 72589 | 1024 |
\textit{raw\_mono\_\allowbreak args}, respectively, but types are mangled in constant names
|
|
44494
a77901b3774e
rationalized option names -- mono becomes raw_mono and mangled becomes mono
blanchet
parents:
44423
diff
changeset
|
1025 |
instead of being supplied as ground term arguments. The binary predicate |
| 46300 | 1026 |
$\const{g}(\tau, t)$ becomes a unary predicate
|
1027 |
$\const{g\_}\tau(t)$, and the binary function
|
|
1028 |
$\const{t}(\tau, t)$ becomes a unary function
|
|
1029 |
$\const{t\_}\tau(t)$.
|
|
|
42589
9f7c48463645
restructured type systems some more -- the old naming schemes had "argshg diff |less" and "tagshg diff |less" as equivalent and didn't support a monomorphic version of "tags"
blanchet
parents:
42582
diff
changeset
|
1030 |
|
| 46435 | 1031 |
\item[\labelitemi] \textbf{\textit{mono\_native} (sound):} Exploits native
|
|
70936
646651bcf261
updated nomenclature for TPTP languages to use modern three-symbol abbreviations (e.g. TF1)
blanchet
parents:
70935
diff
changeset
|
1032 |
first-order types if the prover supports the TF0, TF1, TH0, or TH1 syntax; |
|
46643
a88bccd2b567
added support for Alt-Ergo through Why3 (mostly for experimental purposes, e.g. polymorphism vs. monomorphization)
blanchet
parents:
46640
diff
changeset
|
1033 |
otherwise, falls back on \textit{mono\_guards}. The problem is monomorphized.
|
| 43625 | 1034 |
|
| 72589 | 1035 |
\item[\labelitemi] \textbf{\textit{mono\_native\_fool} (sound):} Exploits native
|
1036 |
first-order types, including Booleans, if the prover supports the TFX0, TFX1, |
|
1037 |
TH0, or TH1 syntax; otherwise, falls back on \textit{mono\_native}. The problem
|
|
1038 |
is monomorphized. |
|
| 42681 | 1039 |
|
| 72589 | 1040 |
\item[\labelitemi] \textbf{\textit{mono\_native\_higher},
|
1041 |
\textit{mono\_native\_higher\_fool} \\ (sound):} Exploits native higher-order
|
|
1042 |
types, including Booleans if ending with ``\textit{\_fool}'', if the prover
|
|
1043 |
supports the TH0 syntax; otherwise, falls back on \textit{mono\_native} or
|
|
1044 |
\textit{mono\_native\_fool}. The problem is monomorphized.
|
|
1045 |
||
1046 |
\item[\labelitemi] \textbf{\textit{poly\_native}, \textit{poly\_native\_fool},
|
|
1047 |
\textit{poly\_native\_higher}, \\ \textit{poly\_native\_higher\_fool} (sound):}
|
|
1048 |
Exploits native first-order polymorphic types if the prover supports the TF1, |
|
1049 |
TFX1, or TH1 syntax; otherwise, falls back on \textit{mono\_native},
|
|
1050 |
\textit{mono\_native\_fool}, \textit{mono\_native\_higher}, or
|
|
1051 |
\textit{mono\_native\_higher\_fool}.
|
|
|
46643
a88bccd2b567
added support for Alt-Ergo through Why3 (mostly for experimental purposes, e.g. polymorphism vs. monomorphization)
blanchet
parents:
46640
diff
changeset
|
1052 |
|
| 45516 | 1053 |
\item[\labelitemi] |
| 42681 | 1054 |
\textbf{%
|
|
44494
a77901b3774e
rationalized option names -- mono becomes raw_mono and mangled becomes mono
blanchet
parents:
44423
diff
changeset
|
1055 |
\textit{poly\_guards}?, \textit{poly\_tags}?, \textit{raw\_mono\_guards}?, \\
|
|
a77901b3774e
rationalized option names -- mono becomes raw_mono and mangled becomes mono
blanchet
parents:
44423
diff
changeset
|
1056 |
\textit{raw\_mono\_tags}?, \textit{mono\_guards}?, \textit{mono\_tags}?, \\
|
| 46435 | 1057 |
\textit{mono\_native}? (sound*):} \\
|
| 43990 | 1058 |
The type encodings \textit{poly\_guards}, \textit{poly\_tags},
|
|
44494
a77901b3774e
rationalized option names -- mono becomes raw_mono and mangled becomes mono
blanchet
parents:
44423
diff
changeset
|
1059 |
\textit{raw\_mono\_guards}, \textit{raw\_mono\_tags}, \textit{mono\_guards},
|
| 47036 | 1060 |
\textit{mono\_tags}, and \textit{mono\_native} are fully typed and sound. For
|
1061 |
each of these, Sledgehammer also provides a lighter variant identified by a |
|
1062 |
question mark (`\hbox{?}')\ that detects and erases monotonic types, notably
|
|
1063 |
infinite types. (For \textit{mono\_native}, the types are not actually erased
|
|
1064 |
but rather replaced by a shared uniform type of individuals.) As argument to the |
|
1065 |
\textit{metis} proof method, the question mark is replaced by a
|
|
1066 |
\hbox{``\textit{\_query\/}''} suffix.
|
|
| 42582 | 1067 |
|
| 45516 | 1068 |
\item[\labelitemi] |
|
42887
771be1dcfef6
document new type system and soundness properties of the different systems
blanchet
parents:
42884
diff
changeset
|
1069 |
\textbf{%
|
| 44769 | 1070 |
\textit{poly\_guards}??, \textit{poly\_tags}??, \textit{raw\_mono\_guards}??, \\
|
1071 |
\textit{raw\_mono\_tags}??, \textit{mono\_guards}??, \textit{mono\_tags}?? \\
|
|
| 46300 | 1072 |
(sound*):} \\ |
| 44816 | 1073 |
Even lighter versions of the `\hbox{?}' encodings. As argument to the
|
1074 |
\textit{metis} proof method, the `\hbox{??}' suffix is replaced by
|
|
| 46242 | 1075 |
\hbox{``\textit{\_query\_query\/}''}.
|
| 44816 | 1076 |
|
| 45516 | 1077 |
\item[\labelitemi] |
| 44816 | 1078 |
\textbf{%
|
| 48184 | 1079 |
\textit{poly\_guards}@, \textit{poly\_tags}@, \textit{raw\_mono\_guards}@, \\
|
1080 |
\textit{raw\_mono\_tags}@ (sound*):} \\
|
|
| 44816 | 1081 |
Alternative versions of the `\hbox{??}' encodings. As argument to the
|
| 48184 | 1082 |
\textit{metis} proof method, the `\hbox{@}' suffix is replaced by
|
1083 |
\hbox{``\textit{\_at\/}''}.
|
|
| 44769 | 1084 |
|
| 48093 | 1085 |
\item[\labelitemi] \textbf{\textit{poly\_args}?, \textit{raw\_mono\_args}? (unsound):} \\
|
1086 |
Lighter versions of \textit{poly\_args} and \textit{raw\_mono\_args}.
|
|
1087 |
||
| 45516 | 1088 |
\item[\labelitemi] \textbf{\textit{smart}:} The actual encoding used depends on
|
| 47036 | 1089 |
the ATP and should be the most efficient sound encoding for that ATP. |
| 42228 | 1090 |
\end{enum}
|
1091 |
||
| 46435 | 1092 |
For SMT solvers, the type encoding is always \textit{mono\_native}, irrespective
|
| 44743 | 1093 |
of the value of this option. |
| 42888 | 1094 |
|
1095 |
\nopagebreak |
|
1096 |
{\small See also \textit{max\_new\_mono\_instances} (\S\ref{relevance-filter})
|
|
1097 |
and \textit{max\_mono\_iters} (\S\ref{relevance-filter}).}
|
|
| 43574 | 1098 |
|
| 46302 | 1099 |
\opfalse{strict}{non\_strict}
|
| 46300 | 1100 |
Specifies whether Sledgehammer should run in its strict mode. In that mode, |
| 46302 | 1101 |
sound type encodings marked with an asterisk (*) above are made complete |
| 46300 | 1102 |
for reconstruction with \textit{metis}, at the cost of some clutter in the
|
1103 |
generated problems. This option has no effect if \textit{type\_enc} is
|
|
1104 |
deliberately set to an unsound encoding. |
|
| 38591 | 1105 |
\end{enum}
|
| 36926 | 1106 |
|
| 68565 | 1107 |
|
| 36926 | 1108 |
\subsection{Output Format}
|
1109 |
\label{output-format}
|
|
1110 |
||
1111 |
\begin{enum}
|
|
1112 |
||
1113 |
\opfalse{verbose}{quiet}
|
|
1114 |
Specifies whether the \textbf{sledgehammer} command should explain what it does.
|
|
1115 |
||
1116 |
\opfalse{debug}{no\_debug}
|
|
| 40203 | 1117 |
Specifies whether Sledgehammer should display additional debugging information |
1118 |
beyond what \textit{verbose} already displays. Enabling \textit{debug} also
|
|
| 61317 | 1119 |
enables \textit{verbose} behind the scenes.
|
| 36926 | 1120 |
|
1121 |
\nopagebreak |
|
| 53801 | 1122 |
{\small See also \textit{spy} (\S\ref{mode-of-operation}) and
|
1123 |
\textit{overlord} (\S\ref{mode-of-operation}).}
|
|
| 36926 | 1124 |
|
| 75030 | 1125 |
\opdefault{max\_proofs}{int}{\upshape 4}
|
| 75031 | 1126 |
Specifies the maximum number of proofs to display before stopping. This is a |
1127 |
soft limit. |
|
| 75030 | 1128 |
|
|
51190
2654b3965c8d
made "isar_proofs" a 3-way option, to provide a way to totally disable isar_proofs if desired
blanchet
parents:
51189
diff
changeset
|
1129 |
\opsmart{isar\_proofs}{no\_isar\_proofs}
|
|
55297
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
1130 |
Specifies whether Isar proofs should be output in addition to one-line proofs. |
|
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
1131 |
The construction of Isar proofs is still experimental and may sometimes fail; |
|
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
1132 |
however, when they succeed they are usually faster and more intelligible than |
|
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
1133 |
one-line proofs. If the option is set to \textit{smart} (the default), Isar
|
|
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
1134 |
proofs are only generated when no working one-line proof is available. |
| 36926 | 1135 |
|
| 57784 | 1136 |
\opdefault{compress}{int}{smart}
|
| 49919 | 1137 |
Specifies the granularity of the generated Isar proofs if \textit{isar\_proofs}
|
|
51190
2654b3965c8d
made "isar_proofs" a 3-way option, to provide a way to totally disable isar_proofs if desired
blanchet
parents:
51189
diff
changeset
|
1138 |
is explicitly enabled. A value of $n$ indicates that each Isar proof step should |
| 57784 | 1139 |
correspond to a group of up to $n$ consecutive proof steps in the ATP proof. If |
1140 |
the option is set to \textit{smart} (the default), the compression factor is 10
|
|
1141 |
if the \textit{isar\_proofs} option is explicitly enabled; otherwise, it is
|
|
1142 |
$\infty$. |
|
| 51189 | 1143 |
|
| 57245 | 1144 |
\optrueonly{dont\_compress}
|
| 57784 | 1145 |
Alias for ``\textit{compress} = 1''.
|
| 51189 | 1146 |
|
| 57245 | 1147 |
\optrue{try0}{dont\_try0}
|
| 53765 | 1148 |
Specifies whether standard proof methods such as \textit{auto} and
|
| 55289 | 1149 |
\textit{blast} should be tried as alternatives to \textit{metis} in Isar proofs.
|
1150 |
The collection of methods is roughly the same as for the \textbf{try0} command.
|
|
1151 |
||
|
71931
0c8a9c028304
simplified 'smt_proofs' option to be a binary option (instead of ternary), now that SMT proofs are accepted in the AFP (done with Martin Desharnais)
blanchet
parents:
70940
diff
changeset
|
1152 |
\optrue{smt\_proofs}{no\_smt\_proofs}
|
| 61283 | 1153 |
Specifies whether the \textit{smt} proof method should be tried in addition to
|
|
71931
0c8a9c028304
simplified 'smt_proofs' option to be a binary option (instead of ternary), now that SMT proofs are accepted in the AFP (done with Martin Desharnais)
blanchet
parents:
70940
diff
changeset
|
1154 |
Isabelle's built-in proof methods. |
| 36926 | 1155 |
\end{enum}
|
1156 |
||
| 68565 | 1157 |
|
| 57241 | 1158 |
\subsection{Regression Testing}
|
1159 |
\label{regression-testing}
|
|
| 38984 | 1160 |
|
1161 |
\begin{enum}
|
|
1162 |
\opnodefault{expect}{string}
|
|
1163 |
Specifies the expected outcome, which must be one of the following: |
|
| 36926 | 1164 |
|
1165 |
\begin{enum}
|
|
| 46300 | 1166 |
\item[\labelitemi] \textbf{\textit{some}:} Sledgehammer found a proof.
|
| 75376 | 1167 |
\item[\labelitemi] \textbf{\textit{some\_preplayed}:} Sledgehammer found a proof that was successfully preplayed.
|
| 45516 | 1168 |
\item[\labelitemi] \textbf{\textit{none}:} Sledgehammer found no proof.
|
1169 |
\item[\labelitemi] \textbf{\textit{timeout}:} Sledgehammer timed out.
|
|
1170 |
\item[\labelitemi] \textbf{\textit{unknown}:} Sledgehammer encountered some
|
|
| 40203 | 1171 |
problem. |
| 38984 | 1172 |
\end{enum}
|
1173 |
||
| 61317 | 1174 |
Sledgehammer emits an error if the actual outcome differs from the expected outcome. This option is |
1175 |
useful for regression testing. |
|
| 38984 | 1176 |
|
| 75387 | 1177 |
The expected outcomes are not mutually exclusive. More specifically, \textit{some} is accepted
|
1178 |
whenever \textit{some\_preplayed} is accepted as the former has strictly fewer requirements
|
|
1179 |
than the latter. |
|
1180 |
||
| 38984 | 1181 |
\nopagebreak |
| 61317 | 1182 |
{\small See also \textit{timeout} (\S\ref{timeouts}).}
|
| 43038 | 1183 |
\end{enum}
|
1184 |
||
| 68565 | 1185 |
|
| 43038 | 1186 |
\subsection{Timeouts}
|
1187 |
\label{timeouts}
|
|
1188 |
||
1189 |
\begin{enum}
|
|
|
54816
10d48c2a3e32
made timeouts in Sledgehammer not be 'option's -- simplified lots of code
blanchet
parents:
54788
diff
changeset
|
1190 |
\opdefault{timeout}{float}{\upshape 30}
|
| 43038 | 1191 |
Specifies the maximum number of seconds that the automatic provers should spend |
1192 |
searching for a proof. This excludes problem preparation and is a soft limit. |
|
1193 |
||
|
75022
e9e27d2e61a1
updated documentation of 'slice' (now 'slices') option
blanchet
parents:
75021
diff
changeset
|
1194 |
\opdefault{slices}{int}{\upshape 6 times the number of cores detected}
|
|
e9e27d2e61a1
updated documentation of 'slice' (now 'slices') option
blanchet
parents:
75021
diff
changeset
|
1195 |
Specifies the number of time slices. Each time slice corresponds to a prover |
|
e9e27d2e61a1
updated documentation of 'slice' (now 'slices') option
blanchet
parents:
75021
diff
changeset
|
1196 |
invocation and has its own set of options. For example, for SPASS, one slice |
|
e9e27d2e61a1
updated documentation of 'slice' (now 'slices') option
blanchet
parents:
75021
diff
changeset
|
1197 |
might specify the fast but incomplete set-of-support (SOS) strategy with 100 |
|
e9e27d2e61a1
updated documentation of 'slice' (now 'slices') option
blanchet
parents:
75021
diff
changeset
|
1198 |
relevant lemmas, whereas other slices might run without SOS and with 500 lemmas. |
|
e9e27d2e61a1
updated documentation of 'slice' (now 'slices') option
blanchet
parents:
75021
diff
changeset
|
1199 |
Slicing (and thereby parallelism) can be disabled by setting \textit{slices} to
|
|
e9e27d2e61a1
updated documentation of 'slice' (now 'slices') option
blanchet
parents:
75021
diff
changeset
|
1200 |
1. Since slicing is a valuable optimization, you should probably leave it |
|
e9e27d2e61a1
updated documentation of 'slice' (now 'slices') option
blanchet
parents:
75021
diff
changeset
|
1201 |
enabled unless you are conducting experiments. |
|
75016
873b581fd690
generalized the 'slice' option towards more flexible slicing
blanchet
parents:
74981
diff
changeset
|
1202 |
|
|
873b581fd690
generalized the 'slice' option towards more flexible slicing
blanchet
parents:
74981
diff
changeset
|
1203 |
\nopagebreak |
|
873b581fd690
generalized the 'slice' option towards more flexible slicing
blanchet
parents:
74981
diff
changeset
|
1204 |
{\small See also \textit{verbose} (\S\ref{output-format}).}
|
|
873b581fd690
generalized the 'slice' option towards more flexible slicing
blanchet
parents:
74981
diff
changeset
|
1205 |
|
|
873b581fd690
generalized the 'slice' option towards more flexible slicing
blanchet
parents:
74981
diff
changeset
|
1206 |
\optrueonly{dont\_slice}
|
|
75022
e9e27d2e61a1
updated documentation of 'slice' (now 'slices') option
blanchet
parents:
75021
diff
changeset
|
1207 |
Alias for ``\textit{slices} = 1''.
|
|
75016
873b581fd690
generalized the 'slice' option towards more flexible slicing
blanchet
parents:
74981
diff
changeset
|
1208 |
|
| 57719 | 1209 |
\opdefault{preplay\_timeout}{float}{\upshape 1}
|
|
55297
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
1210 |
Specifies the maximum number of seconds that \textit{metis} or other proof
|
|
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
1211 |
methods should spend trying to ``preplay'' the found proof. If this option |
|
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
1212 |
is set to 0, no preplaying takes place, and no timing information is displayed |
|
1dfcd49f5dcb
renamed 'smt' option 'smt_proofs' to avoid clash with 'smt' prover
blanchet
parents:
55290
diff
changeset
|
1213 |
next to the suggested proof method calls. |
|
45708
7c8bed80301f
updated Sledgehammer docs with new/renamed options
blanchet
parents:
45555
diff
changeset
|
1214 |
|
|
7c8bed80301f
updated Sledgehammer docs with new/renamed options
blanchet
parents:
45555
diff
changeset
|
1215 |
\nopagebreak |
|
7c8bed80301f
updated Sledgehammer docs with new/renamed options
blanchet
parents:
45555
diff
changeset
|
1216 |
{\small See also \textit{minimize} (\S\ref{mode-of-operation}).}
|
| 47036 | 1217 |
|
1218 |
\optrueonly{dont\_preplay}
|
|
1219 |
Alias for ``\textit{preplay\_timeout} = 0''.
|
|
1220 |
||
| 36926 | 1221 |
\end{enum}
|
1222 |
||
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1223 |
\section{Mirabelle Testing Tool}
|
|
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1224 |
\label{mirabelle}
|
|
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1225 |
|
| 72404 | 1226 |
The \texttt{isabelle mirabelle} tool executes Sledgehammer or other advisory
|
| 73856 | 1227 |
tools (e.g., Nitpick) or tactics (e.g., \textit{auto}) on all subgoals emerging
|
| 72404 | 1228 |
in a theory. It is typically used to measure the success rate of a proof tool |
1229 |
on some benchmark. Its command-line usage is as follows: |
|
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1230 |
|
|
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1231 |
{\small
|
|
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1232 |
\begin{verbatim}
|
| 73855 | 1233 |
Usage: isabelle mirabelle [OPTIONS] [SESSIONS ...] |
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1234 |
|
|
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1235 |
Options are: |
| 73855 | 1236 |
-A ACTION add to list of actions |
| 75021 | 1237 |
-O DIR output directory for log files (default: |
1238 |
"mirabelle") |
|
1239 |
-T THEORY theory restriction: NAME or |
|
1240 |
NAME[FIRST_LINE:LAST_LINE] |
|
1241 |
-m INT max. no. of calls to each action (0: unbounded) |
|
1242 |
(default 0) |
|
1243 |
-s INT run actions on every nth goal (0: uniform |
|
1244 |
distribution) (default 1) |
|
|
74077
b93d8c2ebab0
added automatic uniform stride option to Mirabelle
desharna
parents:
74048
diff
changeset
|
1245 |
-t SECONDS timeout in seconds for each action (default 30) |
| 73855 | 1246 |
... |
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1247 |
|
| 73855 | 1248 |
Apply the given ACTIONs at all theories and proof steps of the |
1249 |
specified sessions. |
|
1250 |
||
1251 |
The absence of theory restrictions (option -T) means to check all |
|
1252 |
theories fully. Otherwise only the named theories are checked. |
|
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1253 |
\end{verbatim}
|
|
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1254 |
} |
|
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1255 |
|
| 73855 | 1256 |
Option \texttt{-A ACTION} specifies an action to run on all subgoals. When
|
1257 |
specified multiple times, all actions are performed in parallel on all |
|
1258 |
selected subgoals. Available actions are \texttt{arith}, \texttt{metis},
|
|
1259 |
\texttt{quickcheck}, \texttt{sledgehammer}, \texttt{sledgehammer\_filter}, and
|
|
1260 |
\texttt{try0}.
|
|
1261 |
||
1262 |
Option \texttt{-O DIR} specifies the output directory, which is created
|
|
1263 |
if needed. In this directory, a log file named \texttt{mirabelle.log} records the |
|
1264 |
position of each tested subgoal and the result of executing the actions. |
|
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1265 |
|
| 73855 | 1266 |
Option \texttt{-T THEORY} restricts the subgoals to those emerging from this
|
1267 |
theory. When not provided, all subgoals from all theories are selected. When |
|
| 73856 | 1268 |
provided multiple times, the union of all specified theories' subgoals is |
| 73855 | 1269 |
selected. |
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1270 |
|
| 73855 | 1271 |
Option \texttt{-m INT} specifies a maximum number of goals on which the actions
|
1272 |
are run. |
|
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1273 |
|
| 73855 | 1274 |
Option \texttt{-s INT} specifies a stride, effectively running the actions on
|
| 75021 | 1275 |
every $n$th goal. |
| 73855 | 1276 |
|
1277 |
Option \texttt{-t SECONDS} specifies a generic timeout that the actions may
|
|
| 72404 | 1278 |
interpret differently. |
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1279 |
|
| 73855 | 1280 |
More specific documentation about low-level options, the \texttt{ACTION}
|
1281 |
parameter, and its corresponding options can be found in the Isabelle tool |
|
| 72404 | 1282 |
usage by entering \texttt{isabelle mirabelle -?} on the command line.
|
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1283 |
|
| 73855 | 1284 |
The following subsections assume that the environment variable \texttt{AFP} is
|
1285 |
defined and points to a release of the Archive of Formal Proofs. |
|
1286 |
||
|
75016
873b581fd690
generalized the 'slice' option towards more flexible slicing
blanchet
parents:
74981
diff
changeset
|
1287 |
|
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1288 |
\subsection{Example of Benchmarking Sledgehammer}
|
|
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1289 |
|
|
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1290 |
\begin{verbatim}
|
|
75016
873b581fd690
generalized the 'slice' option towards more flexible slicing
blanchet
parents:
74981
diff
changeset
|
1291 |
isabelle mirabelle -d '$AFP' -O output \ |
| 74958 | 1292 |
-A "sledgehammer[provers = e, timeout = 30]" \ |
| 73855 | 1293 |
VeriComp |
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1294 |
\end{verbatim}
|
|
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1295 |
|
| 73855 | 1296 |
This command runs the Sledgehammer action, using the E prover with |
| 74958 | 1297 |
a timeout of 30 seconds, on all subgoals emerging from all theories in the AFP |
| 73855 | 1298 |
session VeriComp. The results are written to \texttt{output/mirabelle.log}.
|
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1299 |
|
|
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1300 |
\begin{verbatim}
|
|
75016
873b581fd690
generalized the 'slice' option towards more flexible slicing
blanchet
parents:
74981
diff
changeset
|
1301 |
isabelle mirabelle -d '$AFP' -O output \ |
| 73855 | 1302 |
-T Semantics -T Compiler \ |
| 74958 | 1303 |
-A "sledgehammer[provers = e, timeout = 30]" \ |
| 73855 | 1304 |
VeriComp |
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1305 |
\end{verbatim}
|
|
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1306 |
|
| 73855 | 1307 |
This command also runs the Sledgehammer action, but this time only |
1308 |
on subgoals emerging from theories Semantics or Compiler. |
|
1309 |
||
1310 |
||
1311 |
\subsection{Example of Benchmarking Multiple Tools}
|
|
1312 |
||
1313 |
\begin{verbatim}
|
|
|
75016
873b581fd690
generalized the 'slice' option towards more flexible slicing
blanchet
parents:
74981
diff
changeset
|
1314 |
isabelle mirabelle -d '$AFP' -O output -t 10 \ |
| 73857 | 1315 |
-A "try0" -A "metis" \ |
1316 |
VeriComp |
|
| 73855 | 1317 |
\end{verbatim}
|
1318 |
||
1319 |
This command specifies two actions running the \textbf{try0} and \textbf{metis}
|
|
| 73858 | 1320 |
commands, respectively, each with a timeout of 10 seconds. The results are |
| 73855 | 1321 |
written to \texttt{output/mirabelle.log}.
|
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1322 |
|
|
75016
873b581fd690
generalized the 'slice' option towards more flexible slicing
blanchet
parents:
74981
diff
changeset
|
1323 |
|
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1324 |
\subsection{Example of Generating TPTP Files}
|
|
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1325 |
|
|
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1326 |
\begin{verbatim}
|
|
75016
873b581fd690
generalized the 'slice' option towards more flexible slicing
blanchet
parents:
74981
diff
changeset
|
1327 |
isabelle mirabelle -d '$AFP' -O output \ |
|
74981
10df7a627ab6
split option "sledgehammer_atp_dest_dir" into "sledgehammer_atp_prob_dest_dir" and "sledgehammer_atp_proof_dest_dir"
desharna
parents:
74958
diff
changeset
|
1328 |
-A "sledgehammer[provers = e, timeout = 5, keep_probs = true]" \ |
| 73855 | 1329 |
VeriComp |
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1330 |
\end{verbatim}
|
|
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1331 |
|
| 73855 | 1332 |
This command generates TPTP files using Sledgehammer. Since the file |
1333 |
is generated at the very beginning of every Sledgehammer invocation, |
|
1334 |
a timeout of five seconds, which makes the prover fail faster, speeds up
|
|
74079
180ee02eb075
documented Mirabelle_Sledgehammer's new keep semantics
desharna
parents:
74077
diff
changeset
|
1335 |
processing the subgoals. The results are written in an action-specific |
|
180ee02eb075
documented Mirabelle_Sledgehammer's new keep semantics
desharna
parents:
74077
diff
changeset
|
1336 |
subdirectory of the specified output directory (\texttt{output}). A TPTP
|
|
180ee02eb075
documented Mirabelle_Sledgehammer's new keep semantics
desharna
parents:
74077
diff
changeset
|
1337 |
file is generated for each subgoal. |
|
72342
4195e75a92ef
[mirabelle] add initial documentation in Sledgehammer's doc
desharna
parents:
72319
diff
changeset
|
1338 |
|
| 36926 | 1339 |
\let\em=\sl |
|
48962
a1acc1cb0271
more standard document preparation within session context;
wenzelm
parents:
48803
diff
changeset
|
1340 |
\bibliography{manual}{}
|
| 36926 | 1341 |
\bibliographystyle{abbrv}
|
1342 |
||
1343 |
\end{document}
|