author  blanchet 
Tue, 27 Jul 2010 13:16:37 +0200  
changeset 38009  34e1ac9cb71d 
parent 38005  b6555e9c5de4 
child 38015  b30c3c2e1030 
permissions  rwrr 
36376  1 
(* Title: HOL/Tools/ATP_Manager/atp_systems.ML 
28592  2 
Author: Fabian Immler, TU Muenchen 
3 
Author: Jasmin Blanchette, TU Muenchen 
28592  4 

36376  5 
Setup for supported ATPs. 
28592  6 
*) 
7 

36376  8 
(* Public interface of the ATP setup module. *)
signature ATP_SYSTEMS =
sig
  (* debugging flag consulted by the tracing helper of the structure *)
  val trace : bool Unsynchronized.ref
  (* configuration options, see the "Attrib.config_*" declarations below *)
  val dest_dir : string Config.T
  val problem_prefix : string Config.T
  val measure_runtime : bool Config.T
  val refresh_systems_on_tptp : unit -> unit
  val default_atps_param_value : unit -> string
  val setup : theory -> theory
end;
18 

36376  19 
structure ATP_Systems : ATP_SYSTEMS = 
28592  20 
struct 
21 

22 
open Metis_Clauses 
36187  23 
open Sledgehammer_Util 
35865  24 
open Sledgehammer_Fact_Filter 
25 
open Sledgehammer_TPTP_Format 
35865  26 
open Sledgehammer_Proof_Reconstruct 
35867  27 
open ATP_Manager 
35826  28 

29 
val trace = Unsynchronized.ref false
(* Passes "msg ()" to "tracing" when the "trace" flag is set; the thunk is not
   forced otherwise. *)
fun trace_msg msg =
  case !trace of
    true => tracing (msg ())
  | false => ()
36376  32 
(** generic ATP **) 
33 

32944
ecc0705174c2
clarified File.platform_path vs. File.shell_path;
34 
(* external problem files *) 
35 

36376  36 
(* Configuration option "atp_dest_dir", default "". *)
val (dest_dir, dest_dir_setup) = Attrib.config_string "atp_dest_dir" (K "");
  (*Empty string means create files in Isabelle's temporary files directory.*)

(* Configuration option "atp_problem_prefix", default "prob". *)
val (problem_prefix, problem_prefix_setup) =
  Attrib.config_string "atp_problem_prefix" (K "prob");

(* Configuration option "atp_measure_runtime", default false. *)
val (measure_runtime, measure_runtime_setup) =
  Attrib.config_bool "atp_measure_runtime" (K false);
33247  44 

32864
45 

35867  46 
(* prover configuration *) 
47 

32941
72d48e333b77
48 
(* Static description of one external prover.  "arguments" takes a Boolean
   (bound to "complete" at its call site in this file) and a time limit and
   returns the command-line argument string; "proof_delims" are pairs of
   (begin, end) markers searched for in the prover output; "known_failures"
   associates failures with substrings of the output that identify them. *)
type prover_config =
  {home_var: string,
   executable: string,
   arguments: bool -> Time.time -> string,
   proof_delims: (string * string) list,
   known_failures: (failure * string) list,
   max_new_relevant_facts_per_iter: int,
   prefers_theory_relevant: bool,
   explicit_forall: bool}
28596
57 

fcd463a6b6de
58 

59 
(* basic template *) 
60 

36370
61 
(* Name of the remote variant of a prover: the given name with "remote_"
   prepended. *)
fun remotify name = "remote_" ^ name
62 

32458
63 
(* Applies "f" to "path" and returns its result.  "cleanup path" is run whether
   or not "f" raised an exception; an exception raised by "f" is re-raised
   after the cleanup.  If "f" succeeded, "after path" is applied to the result
   for its side effect before the result is returned. *)
fun with_path cleanup after f path =
  Exn.capture f path
  |> tap (fn _ => cleanup path)
  |> Exn.release
  |> tap (after path)
68 

69 
(* Splits by the first possible of a list of delimiters.  "delims" is a list
   of (begin, end) pairs; the first begin delimiter and the first end delimiter
   that occur in "output" are selected independently of each other.  The result
   is the text after the begin delimiter and before the end delimiter, minus
   everything up to and including the first newline of that text.  Yields ""
   if no delimiter pair is found or any of the splits fails. *)
fun extract_proof delims output =
  case pairself (find_first (fn s => String.isSubstring s output))
                (ListPair.unzip delims) of
    (SOME begin_delim, SOME end_delim) =>
    (output |> first_field begin_delim |> the |> snd
            |> first_field end_delim |> the |> fst
            |> first_field "\n" |> the |> snd
     handle Option.Option => "")
  | _ => ""
32458
79 

37514
80 
(* Classifies a prover run and returns (proof text, optional failure).  If a
   pattern from "known_failures" occurs in "output", the first matching failure
   is reported with an empty proof; "IncompleteUnprovable" is upgraded to
   "Unprovable" when "complete" is true.  Otherwise the proof is extracted via
   "proof_delims"; an empty proof or a nonzero "res_code" yields
   "UnknownError". *)
fun extract_proof_and_outcome complete res_code proof_delims known_failures
                              output =
  case map_filter (fn (failure, pattern) =>
                      if String.isSubstring pattern output then SOME failure
                      else NONE) known_failures of
    [] => (case extract_proof proof_delims output of
             "" => ("", SOME UnknownError)
           | proof => if res_code = 0 then (proof, NONE)
                      else ("", SOME UnknownError))
  | (failure :: _) =>
    ("", SOME (if failure = IncompleteUnprovable andalso complete then
                 Unprovable
               else
                 failure))
36370
94 

95 
(* User-visible message for each kind of ATP failure. *)
fun string_for_failure Unprovable = "The ATP problem is unprovable."
  | string_for_failure IncompleteUnprovable =
    "The ATP cannot prove the problem."
  | string_for_failure CantConnect = "Can't connect to remote ATP."
  | string_for_failure TimedOut = "Timed out."
  | string_for_failure OutOfResources = "The ATP ran out of resources."
  | string_for_failure OldSpass =
    (* FIXME: Change the error message below to point to the Isabelle download
       page once the package is there. *)
    "Warning: Sledgehammer requires a more recent version of SPASS with \
    \support for the TPTP syntax. To install it, download and untar the \
    \package \"http://isabelle.in.tum.de/~blanchet/spass-3.7.tgz\" and add the \
    \\"spass-3.7\" directory's full path to \"" ^
    Path.implode (Path.expand (Path.appends
        (Path.variable "ISABELLE_HOME_USER" ::
         map Path.basic ["etc", "components"]))) ^
    "\" on a line of its own."
  | string_for_failure MalformedInput =
    "Internal Sledgehammer error: The ATP problem is malformed. Please report \
    \this to the Isabelle developers."
  | string_for_failure MalformedOutput = "Error: The ATP output is malformed."
  | string_for_failure UnknownError = "Error: An unknown ATP error occurred."
35865  117 

37623
118 

119 
(* Clause preparation *) 
120 

295f3a9b44b6
121 
(* Builds a term table from "xs", keying each element by the proposition of
   its second component. *)
fun make_clause_table xs =
  fold (Termtab.update o `(prop_of o snd)) xs Termtab.empty
123 

295f3a9b44b6
124 
(* Remove existing axiom clauses from the conjecture clauses, as this can
   dramatically boost an ATP's performance (for some reason).  A theorem is
   dropped when its proposition is a key of the table built from
   "ax_clauses". *)
fun subtract_cls ax_clauses =
  filter_out (Termtab.defined (make_clause_table ax_clauses) o prop_of)
128 

37995
06f02b15ef8a
generate full firstorder formulas (FOF) in Sledgehammer
blanchet
129 
(* Translates a HOL term into a first-order formula over combinator terms.
   Negation, the two quantifiers, conjunction, disjunction, implication and
   equality whose first argument type is bool are mapped to the corresponding
   formula constructors; every other term is eta-contracted and wrapped in
   "APred".  The result is a function that threads an accumulator, to which
   the second component returned by "combterm_from_term" is added with
   "union" for each atom. *)
fun combformula_for_prop thy =
  let
    val do_term = combterm_from_term thy
    (* "bs" collects the (name, type) pairs of the enclosing binders *)
    fun do_quant bs q s T t' =
      do_formula ((s, T) :: bs) t'
      #>> (fn phi => AQuant (q, [`make_bound_var s], phi))
    and do_conn bs c t1 t2 =
      do_formula bs t1 ##>> do_formula bs t2
      #>> (fn (phi1, phi2) => AConn (c, [phi1, phi2]))
    and do_formula bs t =
      case t of
        @{const Not} $ t1 =>
        do_formula bs t1 #>> (fn phi => AConn (ANot, [phi]))
      | Const (@{const_name All}, _) $ Abs (s, T, t') =>
        do_quant bs AForall s T t'
      | Const (@{const_name Ex}, _) $ Abs (s, T, t') =>
        do_quant bs AExists s T t'
      | @{const "op &"} $ t1 $ t2 => do_conn bs AAnd t1 t2
      | @{const "op |"} $ t1 $ t2 => do_conn bs AOr t1 t2
      | @{const "op -->"} $ t1 $ t2 => do_conn bs AImplies t1 t2
      | Const (@{const_name "op ="}, Type (_, [@{typ bool}, _])) $ t1 $ t2 =>
        do_conn bs AIff t1 t2
      | _ => (fn ts => do_term bs (Envir.eta_contract t)
                       |>> APred ||> union (op =) ts)
  in do_formula [] end
37623
154 

38001
155 
(* Converts an elim-rule into an equivalent term that does not have the
   predicate variable. Leaves other terms unchanged. We simply instantiate
   the conclusion variable to False.  Instantiating it to True instead would
   make the rule trivially valid and throw away its content.
   NOTE(review): the theorem-level counterpart is presumably
   "transform_elim_theorem" in "Clausifier" -- confirm. *)
(* FIXME: test! *)
fun transform_elim_term t =
  case Logic.strip_imp_concl t of
    (* conclusion is a schematic Boolean variable under Trueprop *)
    @{const Trueprop} $ Var (z, @{typ bool}) =>
    subst_Vars [(z, @{const False})] t
    (* conclusion is a schematic variable of type prop *)
  | Var (z, @{typ prop}) => subst_Vars [(z, @{prop False})] t
  | _ => t
a9b47b85ca24
166 

a9b47b85ca24
167 
(* Removes the lambdas from an equation of the form "t = (%x. u)". 
168 
(Cf. "extensionalize_theorem" in "Clausifier".) *) 
changeset

169 
changeset

170 
diff
changeset

172 
$ t2 $ Abs (s, var_T, t')) = 
173 
let val var_t = Var (("x", j), var_T) in 
changeset

174 
changeset

175 
changeset

176 
changeset

177 
changeset

178 
changeset

179 
changeset

180 

38001
181 
(* FIXME: Guarantee freshness *) 
182 
(* Name of the free variable standing in for bound variable number "j". *)
fun concealed_bound_name j = String.concat ["Sledgehammer", Int.toString j]
183 
(* Substitutes free variables named by "concealed_bound_name" for the loose
   bound variables of "t".  The substitution list pairs the indices
   "length Ts - 1" down to 0 with the reversed type list.
   NOTE(review): "reveal_bounds" pairs index j with the j-th element of "Ts"
   in ascending order; check that the two orderings agree when "Ts" has more
   than one element. *)
fun conceal_bounds Ts t =
  subst_bounds (map (Free o apfst concealed_bound_name)
                    (length Ts - 1 downto 0 ~~ rev Ts), t)
186 
(* Replaces, for each index j of "Ts", the free variable named
   "concealed_bound_name j" with the j-th type of "Ts" by "Bound j". *)
fun reveal_bounds Ts =
  subst_atomic (map (fn (j, T) => (Free (concealed_bound_name j, T), Bound j))
                    (0 upto length Ts - 1 ~~ Ts))
189 

38005
b6555e9c5de4
prevent schematic variable clash in combinatorintroduction code, when invoked from Sledgehammer (another consequence of the CNF > FOF transition)
190 
fun introduce_combinators_in_term ctxt kind t = 
38001
191 
let 
changeset

192 
diff
changeset

diff
changeset

diff
changeset

diff
changeset

diff
changeset

diff
changeset

diff
changeset

diff
changeset

diff
changeset

diff
changeset

diff
changeset

204 
$ t1 $ t2 => 
205 
t0 $ aux Ts t1 $ aux Ts t2 
206 
 _ => if not (exists_subterm (fn Abs _ => true  _ => false) t) then 
207 
t 
a9b47b85ca24
208 
else 
38005
209 
let 
210 
val t = t > conceal_bounds Ts 
211 
> Envir.eta_contract 
212 
val ([t], ctxt') = Variable.import_terms true [t] ctxt 
213 
in 
214 
t > cterm_of thy 
215 
> Clausifier.introduce_combinators_in_cterm 
216 
> singleton (Variable.export ctxt' ctxt) 
217 
> prop_of > Logic.dest_equals > snd 
218 
> reveal_bounds Ts 
219 
end 
38001
220 
in t > not (Meson.is_fol_term thy t) ? aux [] end 
38005
221 
handle THM _ => 
222 
(* A type variable of sort "{}" will make abstraction fail. *) 
223 
case kind of 
224 
Axiom => HOLogic.true_const 
225 
 Conjecture => HOLogic.false_const 
38001
226 

37623
227 
(* making axiom and conjecture clauses *) 
38005
b6555e9c5de4
prevent schematic variable clash in combinatorintroduction code, when invoked from Sledgehammer (another consequence of the CNF > FOF transition)
blanchet
parents:
38004
diff
changeset

228 
(* Builds a "FOLFormula" named "formula_name" of the given "kind" from the
   term "t".  The term is preprocessed in this order: elim-rule
   transformation, atomization of the object logic, extensionalization, and
   combinator introduction; the result is then translated by
   "combformula_for_prop", starting from an empty accumulator. *)
fun make_clause ctxt (formula_name, kind, t) =
  let
    val thy = ProofContext.theory_of ctxt
    (* ### FIXME: perform other transformations previously done by
       "Clausifier.to_nnf", e.g. "HOL.If" *)
    val t = t |> transform_elim_term
              |> Object_Logic.atomize_term thy
              |> extensionalize_term
              |> introduce_combinators_in_term ctxt kind
    val (combformula, ctypes_sorts) = combformula_for_prop thy t []
  in
    FOLFormula {formula_name = formula_name, combformula = combformula,
                kind = kind, ctypes_sorts = ctypes_sorts}
  end
295f3a9b44b6
242 

38005
b6555e9c5de4
243 
(* Turns the named theorem into an axiom formula; the name is returned
   alongside the formula. *)
fun make_axiom_clause ctxt (name, th) =
  (name, make_clause ctxt (name, Axiom, prop_of th))
245 
(* Turns each term of "ts" into a conjecture formula named after its position
   in the list, counting from 0. *)
fun make_conjecture_clauses ctxt ts =
  map2 (fn j => fn t => make_clause ctxt (Int.toString j, Conjecture, t))
       (0 upto length ts - 1) ts
37623
295f3a9b44b6
move functions not needed by Metis out of "Metis_Clauses"
blanchet
parents:
37621
diff
changeset

248 

295f3a9b44b6
move functions not needed by Metis out of "Metis_Clauses"
295f3a9b44b6
move functions not needed by Metis out of "Metis_Clauses"
37994
b04307085a09
make TPTP generator accept full firstorder formulas
(* Adds 1 to the table entry of every constant occurring in a combinator
   term.  "Symtab.map_entry" only touches keys already present in the table;
   variables contribute nothing. *)
fun count_combterm (CombConst ((s, _), _, _)) =
    Symtab.map_entry s (Integer.add 1)
  | count_combterm (CombVar _) = I
  | count_combterm (CombApp (t1, t2)) = fold count_combterm [t1, t2]
255 
(* Applies "count_combterm" to every atom of a formula, descending through
   quantifiers and connectives. *)
fun count_combformula (AQuant (_, _, phi)) = count_combformula phi
  | count_combformula (AConn (_, phis)) = fold count_combformula phis
  | count_combformula (APred tm) = count_combterm tm
258 
(* Counts the constants in the "combformula" field of a "FOLFormula". *)
fun count_fol_formula (FOLFormula {combformula, ...}) =
  count_combformula combformula
37623
260 

295f3a9b44b6
261 
(* Helper theorems, each group guarded by a list of constant names:
   "get_helper_clauses" includes a group's theorems when at least one of its
   constants is needed. *)
val optional_helpers =
  [(["c_COMBI", "c_COMBK"], @{thms COMBI_def COMBK_def}),
   (["c_COMBB", "c_COMBC"], @{thms COMBB_def COMBC_def}),
   (["c_COMBS"], @{thms COMBS_def})]
(* Further groups that "get_helper_clauses" considers only when "full_types"
   is set. *)
val optional_typed_helpers =
  [(["c_True", "c_False"], @{thms True_or_False}),
   (["c_If"], @{thms if_True if_False True_or_False})]
(* Helpers that "get_helper_clauses" adds whenever the problem is not
   first-order. *)
val mandatory_helpers = @{thms fequal_imp_equal equal_imp_fequal}
295f3a9b44b6
269 

295f3a9b44b6
move functions not needed by Metis out of "Metis_Clauses"
(* Symbol table that maps every constant name guarding an optional helper
   group to 0. *)
val init_counters =
  Symtab.make (maps (maps (map (rpair 0) o fst))
                    [optional_helpers, optional_typed_helpers])
273 

38005
274 
fun get_helper_clauses ctxt is_FO full_types conjectures axclauses = 
37623
275 
let 
37994
276 
val ct = fold (fold count_fol_formula) [conjectures, axclauses] 
b04307085a09
277 
init_counters 
37623
changeset

278 
fun is_needed c = the (Symtab.lookup ct c) > 0 
changeset

279 
val cnfs = 
changeset

280 
(optional_helpers 
281 
> full_types ? append optional_typed_helpers 
changeset

282 
283 
if exists is_needed ss then map (`Thm.get_name_hint) ths 
284 
else [])) @ 
285 
(if is_FO then [] else map (`Thm.get_name_hint) mandatory_helpers) 
38005
286 
in map (snd o make_axiom_clause ctxt) cnfs end 
37623
295f3a9b44b6
move functions not needed by Metis out of "Metis_Clauses"
blanchet
parents:
37621
diff
changeset

287 

38002
288 
(* Negates a term, cancelling an outermost "Not" instead of stacking a second
   negation on top of it. *)
fun s_not (@{const Not} $ t) = t
  | s_not t = @{const Not} $ t
37995
290 

37623
295f3a9b44b6
291 
(* prepare for passing to writer,
   create additional clauses based on the information from extra_cls.

   Returns the vector of axiom names taken from "axcls" together with the
   tuple (conjectures, axiom clauses, extra clauses, helper clauses,
   class-relation clauses, arity clauses).  The conjectures are the negated
   hypotheses followed by the conclusion, each stripped of "Trueprop". *)
fun prepare_clauses ctxt full_types hyp_ts concl_t axcls extra_cls =
  let
    val thy = ProofContext.theory_of ctxt
    val goal_t = Logic.list_implies (hyp_ts, concl_t)
    val is_FO = Meson.is_fol_term thy goal_t
    val _ = trace_msg (fn _ => Syntax.string_of_term ctxt goal_t)
    val axtms = map (prop_of o snd) extra_cls
    val subs = tfree_classes_of_terms [goal_t]
    val supers = tvar_classes_of_terms axtms
    val tycons = type_consts_of_terms thy (goal_t :: axtms)
    (* TFrees in conjecture clauses; TVars in axiom clauses *)
    val conjectures =
      map (s_not o HOLogic.dest_Trueprop) hyp_ts @
        [HOLogic.dest_Trueprop concl_t]
      |> make_conjecture_clauses ctxt
    val extra_clauses = map (snd o make_axiom_clause ctxt) extra_cls
    val (clnames, axiom_clauses) =
      ListPair.unzip (map (make_axiom_clause ctxt) axcls)
    (* FIXME: Should it read "extra_clauses" or "axiom_clauses" in the
       "get_helper_clauses" call? *)
    val helper_clauses =
      get_helper_clauses ctxt is_FO full_types conjectures extra_clauses
    val (supers', arity_clauses) = make_arity_clauses thy tycons supers
    val class_rel_clauses = make_class_rel_clauses thy subs supers'
  in
    (Vector.fromList clnames,
      (conjectures, axiom_clauses, extra_clauses, helper_clauses,
       class_rel_clauses, arity_clauses))
  end
295f3a9b44b6
322 

37962
323 
(* Collects clause numbers from the lines of "output".  Each line is split
   into alphanumeric tokens; a line whose first token is "clause" and that has
   at least one further token contributes the integer parsed from its last
   token.  Lines that do not match, or whose last token is not a number, are
   ignored. *)
fun extract_clause_sequence output =
  let
    val tokens_of = String.tokens (not o Char.isAlphaNum)
    fun extract_num ("clause" :: (ss as _ :: _)) =
    Int.fromString (List.last ss)
      | extract_num _ = NONE
  in output |> split_lines |> map_filter (extract_num o tokens_of) end
d7dbe01f48d7
keep track of clause numbers for SPASS now that we generate FOF rather than CNF problems;
blanchet
parents:
37926
diff
changeset

330 

d7dbe01f48d7
keep track of clause numbers for SPASS now that we generate FOF rather than CNF problems;
blanchet
parents:
37926
diff
changeset

331 
(* Marker string looked for in the prover output; the clause/formula relation
   is parsed from the text that starts at this marker. *)
val set_ClauseFormulaRelationN = "set_ClauseFormulaRelation" 
d7dbe01f48d7
keep track of clause numbers for SPASS now that we generate FOF rather than CNF problems;
blanchet
parents:
37926
diff
changeset

332 

d7dbe01f48d7
keep track of clause numbers for SPASS now that we generate FOF rather than CNF problems;
blanchet
parents:
37926
diff
changeset

333 
(* Parses one "(<integer>,<identifier>)" pair, optionally followed by a comma,
   and yields the integer together with the identifier. *)
val parse_clause_formula_pair =
  $$ "(" |-- scan_integer --| $$ "," -- Symbol.scan_id --| $$ ")"
  --| Scan.option ($$ ",")
d7dbe01f48d7
keep track of clause numbers for SPASS now that we generate FOF rather than CNF problems;
blanchet
parents:
37926
diff
changeset

336 
(* Parses the marker "set_ClauseFormulaRelation", an opening parenthesis and
   then as many clause/formula pairs as follow; yields the list of pairs. *)
val parse_clause_formula_relation =
  Scan.this_string set_ClauseFormulaRelationN |-- $$ "("
  |-- Scan.repeat parse_clause_formula_pair
d7dbe01f48d7
keep track of clause numbers for SPASS now that we generate FOF rather than CNF problems;
blanchet
parents:
37926
diff
changeset

339 
(* Extracts the clause/formula pairs from prover output: takes the text from
   the first occurrence of the marker onwards, passes it through
   "strip_spaces", explodes it into symbols and runs
   "parse_clause_formula_relation" on it, keeping the parsed pairs. *)
val extract_clause_formula_relation =
  Substring.full
  #> Substring.position set_ClauseFormulaRelationN
  #> snd #> Substring.string #> strip_spaces #> explode
  #> parse_clause_formula_relation #> fst
d7dbe01f48d7
keep track of clause numbers for SPASS now that we generate FOF rather than CNF problems;
blanchet
parents:
37926
diff
changeset

344 

37989
ca3041b0f445
reorder SPASS conjectures correctly, based on Flotter output
blanchet
parents:
37962
diff
changeset

345 
(* Recomputes the conjecture numbers and the vector of theorem names from the
   prover output when the output contains the clause/formula relation marker;
   otherwise returns both arguments unchanged.

   In the repaired result, each conjecture number j is replaced by the 1-based
   position, in the clause sequence of the output, of the clause related to
   the formula named "conjecture_prefix ^ (j - j0)", where j0 is the head of
   "conjecture_shape".  The theorem names are the formula names of the clause
   sequence with "axiom_prefix" removed and the ASCII encoding undone; clauses
   that do not stem from an axiom get the name "". *)
fun repair_conjecture_shape_and_theorem_names output conjecture_shape
                                              thm_names =
  if String.isSubstring set_ClauseFormulaRelationN output then
    (* This is a hack required for keeping track of axioms after they have been
       clausified by SPASS's Flotter tool. The "SPASS_TPTP" script is also part
       of this hack. *)
    let
      val j0 = hd conjecture_shape
      val seq = extract_clause_sequence output
      val name_map = extract_clause_formula_relation output
      fun renumber_conjecture j =
        AList.find (op =) name_map (conjecture_prefix ^ Int.toString (j - j0))
        |> the_single
        |> (fn s => find_index (curry (op =) s) seq + 1)
    in
      (conjecture_shape |> map renumber_conjecture,
       seq |> map (the o AList.lookup (op =) name_map)
           |> map (fn s => case try (unprefix axiom_prefix) s of
                             SOME s' => undo_ascii_of s'
                           | NONE => "")
           |> Vector.fromList)
    end
  else
    (conjecture_shape, thm_names)
37962
d7dbe01f48d7
keep track of clause numbers for SPASS now that we generate FOF rather than CNF problems;
blanchet
parents:
37926
diff
changeset

369 

37623
295f3a9b44b6
move functions not needed by Metis out of "Metis_Clauses"
blanchet
parents:
37621
diff
changeset

370 

37499
5ff37037fbec
merge "generic_prover" and "generic_tptp_prover"
blanchet
parents:
37498
diff
changeset

371 
(* generic TPTP-based provers *)
5ff37037fbec
merge "generic_prover" and "generic_tptp_prover"
blanchet
parents:
37498
diff
changeset

372 

5ff37037fbec
merge "generic_prover" and "generic_tptp_prover"
blanchet
parents:
37498
diff
changeset

373 
fun generic_tptp_prover 
5ff37037fbec
merge "generic_prover" and "generic_tptp_prover"
blanchet
parents:
37498
diff
changeset

374 
(name, {home_var, executable, arguments, proof_delims, known_failures, 
38009
34e1ac9cb71d
shrink the "max_new_relevant_facts_per_iter" fudge factors, now that we count formulas and not clauses
blanchet
parents:
38005
diff
changeset

375 
max_new_relevant_facts_per_iter, prefers_theory_relevant, 
34e1ac9cb71d
shrink the "max_new_relevant_facts_per_iter" fudge factors, now that we count formulas and not clauses
blanchet
parents:
38005
diff
changeset

376 
explicit_forall}) 
37580
c2c1caff5dea
got rid of "respect_no_atp" option, which even I don't use
blanchet
parents:
37578
diff
changeset

377 
({debug, overlord, full_types, explicit_apply, relevance_threshold, 
c2c1caff5dea
got rid of "respect_no_atp" option, which even I don't use
blanchet
parents:
37578
diff
changeset

378 
relevance_convergence, theory_relevant, defs_relevant, isar_proof, 
c2c1caff5dea
got rid of "respect_no_atp" option, which even I don't use
blanchet
parents:
37578
diff
changeset

379 
isar_shrink_factor, ...} : params) 
37499
5ff37037fbec
merge "generic_prover" and "generic_tptp_prover"
blanchet
parents:
37498
diff
changeset

380 
minimize_command timeout 
35969  381 
({subgoal, goal, relevance_override, axiom_clauses, filtered_clauses} 
382 
: problem) = 

28596
fcd463a6b6de
tuned interfaces  plain prover function, without thread;
wenzelm
parents:
28592
diff
changeset

383 
let 
31750  384 
(* get clauses and prepare them for writing *) 
37498
b426cbdb5a23
removed Sledgehammer's support for the DFG syntax;
blanchet
parents:
37480
diff
changeset

385 
val (ctxt, (_, th)) = goal; 
38005
b6555e9c5de4
prevent schematic variable clash in combinatorintroduction code, when invoked from Sledgehammer (another consequence of the CNF > FOF transition)
blanchet
parents:
38004
diff
changeset

386 
val thy = ProofContext.theory_of ctxt 
37995
06f02b15ef8a
generate full firstorder formulas (FOF) in Sledgehammer
blanchet
parents:
37994
diff
changeset

387 
(* ### FIXME: (1) preprocessing for "if" etc. *) 
06f02b15ef8a
generate full firstorder formulas (FOF) in Sledgehammer
blanchet
parents:
37994
diff
changeset

388 
val (params, hyp_ts, concl_t) = strip_subgoal th subgoal 
31752
19a5f1c8a844
use results of relevancefilter to determine additional clauses;
immler@in.tum.de
parents:
31751
diff
changeset

389 
val the_filtered_clauses = 
37621  390 
case filtered_clauses of 
391 
SOME fcls => fcls 

392 
 NONE => relevant_facts full_types relevance_threshold 

38009
34e1ac9cb71d
shrink the "max_new_relevant_facts_per_iter" fudge factors, now that we count formulas and not clauses
blanchet
parents:
38005
diff
changeset

393 
relevance_convergence defs_relevant 
34e1ac9cb71d
shrink the "max_new_relevant_facts_per_iter" fudge factors, now that we count formulas and not clauses
blanchet
parents:
38005
diff
changeset

394 
max_new_relevant_facts_per_iter 
37499
5ff37037fbec
merge "generic_prover" and "generic_tptp_prover"
blanchet
parents:
37498
diff
changeset

395 
(the_default prefers_theory_relevant theory_relevant) 
37995
06f02b15ef8a
generate full firstorder formulas (FOF) in Sledgehammer
blanchet
parents:
37994
diff
changeset

396 
relevance_override goal hyp_ts concl_t 
37506
32a1ee39c49b
missing "Unsynchronized" + make exception take a unit
blanchet
parents:
37499
diff
changeset

397 
val the_axiom_clauses = axiom_clauses > the_default the_filtered_clauses 
35969  398 
val (internal_thm_names, clauses) = 
38005
b6555e9c5de4
prevent schematic variable clash in combinatorintroduction code, when invoked from Sledgehammer (another consequence of the CNF > FOF transition)
blanchet
parents:
38004
diff
changeset

399 
prepare_clauses ctxt full_types hyp_ts concl_t the_axiom_clauses 
b6555e9c5de4
prevent schematic variable clash in combinatorintroduction code, when invoked from Sledgehammer (another consequence of the CNF > FOF transition)
blanchet
parents:
38004
diff
changeset

400 
the_filtered_clauses 
31750  401 

32864
a226f29d4bdc
reorganized signature of AtpWrapper structure: records instead of unnamed parameters and return values,
boehmes
parents:
32740
diff
changeset

402 
(* path to unique problem file *) 
36376  403 
val the_dest_dir = if overlord then getenv "ISABELLE_HOME_USER" 
404 
else Config.get ctxt dest_dir; 

405 
val the_problem_prefix = Config.get ctxt problem_prefix; 

32864
a226f29d4bdc
reorganized signature of AtpWrapper structure: records instead of unnamed parameters and return values,
boehmes
parents:
32740
diff
changeset

406 
fun prob_pathname nr = 
36143
6490319b1703
added "overlord" option (to get easy access to output files for debugging) + systematically use "raw_goal" rather than an inconsistent mixture
blanchet
parents:
36142
diff
changeset

407 
let 
6490319b1703
added "overlord" option (to get easy access to output files for debugging) + systematically use "raw_goal" rather than an inconsistent mixture
blanchet
parents:
36142
diff
changeset

408 
val probfile = 
36568
d495d2e1f0a6
in "overlord" mode: ignore problem prefix specified in the .thy file
blanchet
parents:
36552
diff
changeset

409 
Path.basic ((if overlord then "prob_" ^ name 
d495d2e1f0a6
in "overlord" mode: ignore problem prefix specified in the .thy file
blanchet
parents:
36552
diff
changeset

410 
else the_problem_prefix ^ serial_string ()) 
36143
6490319b1703
added "overlord" option (to get easy access to output files for debugging) + systematically use "raw_goal" rather than an inconsistent mixture
blanchet
parents:
36142
diff
changeset

411 
^ "_" ^ string_of_int nr) 
32942
b6711ec9de26
misc tuning and recovery of Isabelle coding style;
wenzelm
parents:
32941
diff
changeset

412 
in 
36376  413 
if the_dest_dir = "" then File.tmp_path probfile 
414 
else if File.exists (Path.explode the_dest_dir) 

415 
then Path.append (Path.explode the_dest_dir) probfile 

416 
else error ("No such directory: " ^ the_dest_dir ^ ".") 

32942
b6711ec9de26
misc tuning and recovery of Isabelle coding style;
wenzelm
parents:
32941
diff
changeset

417 
end; 
32864
a226f29d4bdc
reorganized signature of AtpWrapper structure: records instead of unnamed parameters and return values,
boehmes
parents:
32740
diff
changeset

418 

36917
8674cdb0b8cc
query _HOME environment variables at runtime, not at buildtime
blanchet
parents:
36910
diff
changeset

419 
val home = getenv home_var 
36289
f75b6a3e1450
set "atps" reference's default value to "(remote_)e (remote_)spass (remote_)vampire", based on what is installed
blanchet
parents:
36287
diff
changeset

420 
val command = Path.explode (home ^ "/" ^ executable) 
31750  421 
(* write out problem file and call prover *) 
37514
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

422 
fun command_line complete probfile = 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

423 
let 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

424 
val core = File.shell_path command ^ " " ^ arguments complete timeout ^ 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

425 
" " ^ File.shell_path probfile 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

426 
in 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

427 
(if Config.get ctxt measure_runtime then 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

428 
"TIMEFORMAT='%3U'; { time " ^ core ^ " ; }" 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

429 
else 
37962
d7dbe01f48d7
keep track of clause numbers for SPASS now that we generate FOF rather than CNF problems;
blanchet
parents:
37926
diff
changeset

430 
"exec " ^ core) ^ " 2>&1" 
37514
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

431 
end 
32510  432 
fun split_time s = 
433 
let 

32942
b6711ec9de26
misc tuning and recovery of Isabelle coding style;
wenzelm
parents:
32941
diff
changeset

434 
val split = String.tokens (fn c => str c = "\n"); 
36369
d2cd0d04b8e6
handle ATP proof delimiters in a cleaner, more extensible fashion
blanchet
parents:
36289
diff
changeset

435 
val (output, t) = s > split > split_last > apfst cat_lines; 
32942
b6711ec9de26
misc tuning and recovery of Isabelle coding style;
wenzelm
parents:
32941
diff
changeset

436 
fun as_num f = f >> (fst o read_int); 
b6711ec9de26
misc tuning and recovery of Isabelle coding style;
wenzelm
parents:
32941
diff
changeset

437 
val num = as_num (Scan.many1 Symbol.is_ascii_digit); 
b6711ec9de26
misc tuning and recovery of Isabelle coding style;
wenzelm
parents:
32941
diff
changeset

438 
val digit = Scan.one Symbol.is_ascii_digit; 
b6711ec9de26
misc tuning and recovery of Isabelle coding style;
wenzelm
parents:
32941
diff
changeset

439 
val num3 = as_num (digit ::: digit ::: (digit >> single)); 
b6711ec9de26
misc tuning and recovery of Isabelle coding style;
wenzelm
parents:
32941
diff
changeset

440 
val time = num  Scan.$$ "."  num3 >> (fn (a, b) => a * 1000 + b); 
b6711ec9de26
misc tuning and recovery of Isabelle coding style;
wenzelm
parents:
32941
diff
changeset

441 
val as_time = the_default 0 o Scan.read Symbol.stopper time o explode; 
36369
d2cd0d04b8e6
handle ATP proof delimiters in a cleaner, more extensible fashion
blanchet
parents:
36289
diff
changeset

442 
in (output, as_time t) end; 
32458
de6834b20e9e
sledgehammer's temporary files are removed properly (even in case of an exception occurs)
boehmes
parents:
32451
diff
changeset

443 
fun run_on probfile = 
37962
d7dbe01f48d7
keep track of clause numbers for SPASS now that we generate FOF rather than CNF problems;
blanchet
parents:
37926
diff
changeset

444 
if home = "" then 
d7dbe01f48d7
keep track of clause numbers for SPASS now that we generate FOF rather than CNF problems;
blanchet
parents:
37926
diff
changeset

445 
error ("The environment variable " ^ quote home_var ^ " is not set.") 
d7dbe01f48d7
keep track of clause numbers for SPASS now that we generate FOF rather than CNF problems;
blanchet
parents:
37926
diff
changeset

446 
else if File.exists command then 
37514
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

447 
let 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

448 
fun do_run complete = 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

449 
let 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

450 
val command = command_line complete probfile 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

451 
val ((output, msecs), res_code) = 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

452 
bash_output command 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

453 
>> (if overlord then 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

454 
prefix ("% " ^ command ^ "\n% " ^ timestamp () ^ "\n") 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

455 
else 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

456 
I) 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

457 
>> (if Config.get ctxt measure_runtime then split_time 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

458 
else rpair 0) 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

459 
val (proof, outcome) = 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

460 
extract_proof_and_outcome complete res_code proof_delims 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

461 
known_failures output 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

462 
in (output, msecs, proof, outcome) end 
37643
f576af716aa6
rewrote the TPTP problem generation code more or less from scratch;
blanchet
parents:
37628
diff
changeset

463 
val readable_names = debug andalso overlord 
37514
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

464 
val (pool, conjecture_offset) = 
37994
b04307085a09
make TPTP generator accept full firstorder formulas
blanchet
parents:
37989
diff
changeset

465 
write_tptp_file thy readable_names explicit_forall full_types 
b04307085a09
make TPTP generator accept full firstorder formulas
blanchet
parents:
37989
diff
changeset

466 
explicit_apply probfile clauses 
37995
06f02b15ef8a
generate full firstorder formulas (FOF) in Sledgehammer
blanchet
parents:
37994
diff
changeset

467 
val conjecture_shape = 
06f02b15ef8a
generate full firstorder formulas (FOF) in Sledgehammer
blanchet
parents:
37994
diff
changeset

468 
conjecture_offset + 1 upto conjecture_offset + length hyp_ts + 1 
37514
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

469 
val result = 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

470 
do_run false 
37550
fc2f979b9a08
split SPASS time slot between SOS and nonSOS, in case SOS times out
blanchet
parents:
37514
diff
changeset

471 
> (fn (_, msecs0, _, SOME _) => 
37514
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

472 
do_run true 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

473 
> (fn (output, msecs, proof, outcome) => 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

474 
(output, msecs0 + msecs, proof, outcome)) 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

475 
 result => result) 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

476 
in ((pool, conjecture_shape), result) end 
36382  477 
else 
478 
error ("Bad executable: " ^ Path.implode command ^ "."); 

28592  479 

36167
c1a35be8e476
make Sledgehammer's output more debugging friendly
blanchet
parents:
36143
diff
changeset

480 
(* If the problem file has not been exported, remove it; otherwise, export 
c1a35be8e476
make Sledgehammer's output more debugging friendly
blanchet
parents:
36143
diff
changeset

481 
the proof file too. *) 
36376  482 
fun cleanup probfile = 
483 
if the_dest_dir = "" then try File.rm probfile else NONE 

37514
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

484 
fun export probfile (_, (output, _, _, _)) = 
36376  485 
if the_dest_dir = "" then 
36187  486 
() 
487 
else 

37514
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

488 
File.write (Path.explode (Path.implode probfile ^ "_proof")) output 
32257
bad5a99c16d8
neg_conjecture_clauses, neg_clausify_tac: proper context, eliminated METAHYPS;
wenzelm
parents:
32091
diff
changeset

489 

37514
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

490 
val ((pool, conjecture_shape), (output, msecs, proof, outcome)) = 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

491 
with_path cleanup export run_on (prob_pathname subgoal) 
37989
ca3041b0f445
reorder SPASS conjectures correctly, based on Flotter output
blanchet
parents:
37962
diff
changeset

492 
val (conjecture_shape, internal_thm_names) = 
ca3041b0f445
reorder SPASS conjectures correctly, based on Flotter output
blanchet
parents:
37962
diff
changeset

493 
repair_conjecture_shape_and_theorem_names output conjecture_shape 
ca3041b0f445
reorder SPASS conjectures correctly, based on Flotter output
blanchet
parents:
37962
diff
changeset

494 
internal_thm_names 
37514
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

495 

35969  496 
val (message, relevant_thm_names) = 
36370
a4f601daa175
centralized ATPspecific error handling in "atp_wrapper.ML"
blanchet
parents:
36369
diff
changeset

497 
case outcome of 
36400
c5bae529f967
rename options and keep track of conjecture shape (to facilitate proof reconstruction)
blanchet
parents:
36393
diff
changeset

498 
NONE => 
c5bae529f967
rename options and keep track of conjecture shape (to facilitate proof reconstruction)
blanchet
parents:
36393
diff
changeset

499 
proof_text isar_proof 
37480  500 
(pool, debug, isar_shrink_factor, ctxt, conjecture_shape) 
501 
(full_types, minimize_command, proof, internal_thm_names, th, 

502 
subgoal) 

36370
a4f601daa175
centralized ATPspecific error handling in "atp_wrapper.ML"
blanchet
parents:
36369
diff
changeset

503 
 SOME failure => (string_for_failure failure ^ "\n", []) 
32864
a226f29d4bdc
reorganized signature of AtpWrapper structure: records instead of unnamed parameters and return values,
boehmes
parents:
32740
diff
changeset

504 
in 
36393
be73a2b2443b
support readable names even when Isar proof reconstruction is enabled  useful for debugging
blanchet
parents:
36382
diff
changeset

505 
{outcome = outcome, message = message, pool = pool, 
37514
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

506 
relevant_thm_names = relevant_thm_names, atp_run_time_in_msecs = msecs, 
b147d01b8ebc
if SPASS fails at finding a proof with the SOS option turned on, turn it off and try again
blanchet
parents:
37509
diff
changeset

507 
output = output, proof = proof, internal_thm_names = internal_thm_names, 
36400
c5bae529f967
rename options and keep track of conjecture shape (to facilitate proof reconstruction)
blanchet
parents:
36393
diff
changeset

508 
conjecture_shape = conjecture_shape, 
35969  509 
filtered_clauses = the_filtered_clauses} 
37499
5ff37037fbec
merge "generic_prover" and "generic_tptp_prover"
blanchet
parents:
37498
diff
changeset

510 
end 
28596
fcd463a6b6de
tuned interfaces  plain prover function, without thread;
wenzelm
parents:
28592
diff
changeset

511 

35969  512 
(* Pairs a prover name with the generic TPTP prover built from that name and
   its configuration. *)
fun tptp_prover name config =
  let val prover = generic_tptp_prover (name, config)
  in (name, prover) end;
28596
fcd463a6b6de
tuned interfaces  plain prover function, without thread;
wenzelm
parents:
28592
diff
changeset

513 

36382  514 
(* Converts a time value to whole seconds, rounding any fraction of a second
   up rather than down. *)
fun to_generous_secs time =
  let val msecs = Time.toMilliseconds time
  in (msecs + 999) div 1000 end
36142
f5e15e9aae10
make Sledgehammer "minimize" output less confusing + round up (not down) time limits to nearest second
blanchet
parents:
36064
diff
changeset

515 

28596
fcd463a6b6de
tuned interfaces  plain prover function, without thread;
wenzelm
parents:
28592
diff
changeset

516 
(* E prover *) 
fcd463a6b6de
tuned interfaces  plain prover function, without thread;
wenzelm
parents:
28592
diff
changeset

517 

36369
d2cd0d04b8e6
handle ATP proof delimiters in a cleaner, more extensible fashion
blanchet
parents:
36289
diff
changeset

518 
(* Pair of (start, end) marker strings used as proof delimiters by the
   configurations that reference it. *)
val tstp_proof_delims =
  let
    val start_marker = "# SZS output start CNFRefutation."
    val end_marker = "# SZS output end CNFRefutation"
  in (start_marker, end_marker) end
d2cd0d04b8e6
handle ATP proof delimiters in a cleaner, more extensible fashion
blanchet
parents:
36289
diff
changeset

520 

35969  521 
(* Configuration for the E prover, started through the "eproof" executable.
   "home_var" names the environment variable that locates the executable. *)
val e_config : prover_config =
  {home_var = "E_HOME",
   executable = "eproof",
   (* The first argument (the completeness flag) is ignored for E; the time
      limit is passed in whole seconds, rounded up. *)
   arguments = fn _ => fn timeout =>
     "--tstp-in --tstp-out -l5 -xAutoDev -tAutoDev --silent --cpu-limit=" ^
     string_of_int (to_generous_secs timeout),
   proof_delims = [tstp_proof_delims],
   (* Output fragments paired with the failure they indicate. *)
   known_failures =
     [(Unprovable, "SZS status: CounterSatisfiable"),
      (Unprovable, "SZS status CounterSatisfiable"),
      (TimedOut, "Failure: Resource limit exceeded (time)"),
      (TimedOut, "time limit exceeded"),
      (OutOfResources,
       "# Cannot determine problem status within resource limit"),
      (OutOfResources, "SZS status: ResourceOut"),
      (OutOfResources, "SZS status ResourceOut")],
   max_new_relevant_facts_per_iter = 80 (* FIXME *),
   prefers_theory_relevant = false,
   explicit_forall = false}

(* The local E prover entry: its name paired with the generic TPTP prover. *)
val e = tptp_prover "e" e_config
28596
fcd463a6b6de
tuned interfaces  plain prover function, without thread;
wenzelm
parents:
28592
diff
changeset

541 

fcd463a6b6de
tuned interfaces  plain prover function, without thread;
wenzelm
parents:
28592
diff
changeset

542 

36219
16670b4f0baa
set SPASS option on the commandline, so that it doesn't vanish when moving to TPTP format
blanchet
parents:
36190
diff
changeset

543 
(* The "-VarWeight=3" option helps the higher-order problems, probably by
   counteracting the presence of "hAPP". *)
val spass_config : prover_config =
  {home_var = "ISABELLE_ATP_MANAGER",
   executable = "SPASS_TPTP",
   (* "div 2" accounts for the fact that SPASS is often run twice. *)
   arguments = fn complete => fn timeout =>
     ("-Auto -PGiven=0 -PProblem=0 -Splits=0 -FullRed=0 -DocProof \
      \-VarWeight=3 -TimeLimit=" ^
      string_of_int (to_generous_secs timeout div 2))
     (* The SOS option is only prepended when "complete" is false. *)
     |> not complete ? prefix "-SOS=1 ",
   proof_delims = [("Here is a proof", "Formulae used in the proof")],
   (* Output fragments paired with the failure they indicate. *)
   known_failures =
     [(IncompleteUnprovable, "SPASS beiseite: Completion found"),
      (TimedOut, "SPASS beiseite: Ran out of time"),
      (OutOfResources, "SPASS beiseite: Maximal number of loops exceeded"),
      (MalformedInput, "Undefined symbol"),
      (MalformedInput, "Free Variable"),
      (OldSpass, "tptp2dfg")],
   max_new_relevant_facts_per_iter = 26 (* FIXME *),
   prefers_theory_relevant = true,
   explicit_forall = true}

(* The local SPASS entry: its name paired with the generic TPTP prover. *)
val spass = tptp_prover "spass" spass_config
28596
fcd463a6b6de
tuned interfaces  plain prover function, without thread;
wenzelm
parents:
28592
diff
changeset

566 

37509
f39464d971c4
factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents:
37506
diff
changeset

567 
(* Vampire *) 
f39464d971c4
factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents:
37506
diff
changeset

568 

f39464d971c4
factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents:
37506
diff
changeset

569 
(* Configuration for the Vampire prover. "home_var" names the environment
   variable that locates the executable. *)
val vampire_config : prover_config =
  {home_var = "VAMPIRE_HOME",
   executable = "vampire",
   (* The first argument (the completeness flag) is ignored for Vampire; the
      time limit is passed in whole seconds, rounded up. *)
   arguments = fn _ => fn timeout =>
     "--output_syntax tptp --mode casc -t " ^
     string_of_int (to_generous_secs timeout),
   (* Two alternative pairs of proof delimiters are accepted. *)
   proof_delims =
     [("=========== Refutation ==========",
       "======= End of refutation ======="),
      ("% SZS output start Refutation", "% SZS output end Refutation")],
   (* Output fragments paired with the failure they indicate. *)
   known_failures =
     [(Unprovable, "UNPROVABLE"),
      (IncompleteUnprovable, "CANNOT PROVE"),
      (Unprovable, "Satisfiability detected"),
      (OutOfResources, "Refutation not found")],
   max_new_relevant_facts_per_iter = 40 (* FIXME *),
   prefers_theory_relevant = false,
   explicit_forall = false}

(* The local Vampire entry: its name paired with the generic TPTP prover. *)
val vampire = tptp_prover "vampire" vampire_config
f39464d971c4
factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents:
37506
diff
changeset

588 

f39464d971c4
factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents:
37506
diff
changeset

589 
(* Remote prover invocation via SystemOnTPTP *) 
28596
fcd463a6b6de
tuned interfaces  plain prover function, without thread;
wenzelm
parents:
28592
diff
changeset

590 

36376  591 
(* Synchronized list of system names; it starts out empty and is filled with
   the result of get_systems by refresh_systems_on_tptp and get_system. *)
val systems = Synchronized.var "atp_systems" ([]: string list); 
31835  592 

593 
(* Runs the SystemOnTPTP script with "-w" and returns its output split into
   lines. A nonzero exit code raises an error that carries the script's
   output, with one trailing newline removed if present. *)
fun get_systems () =
  case bash_output "\"$ISABELLE_ATP_MANAGER/SystemOnTPTP\" -w" of
    (answer, 0) => split_lines answer
  | (answer, _) =>
    error ("Failed to get available systems at SystemOnTPTP:\n" ^
           perhaps (try (unsuffix "\n")) answer)

31835  599 

35867  600 
(* Replaces the stored system list with a freshly fetched one, regardless of
   what was stored before. *)
fun refresh_systems_on_tptp () =
  let fun reload _ = get_systems ()
  in Synchronized.change systems reload end
31835  602 

603 
(* Returns the first stored system name that starts with "prefix", if any.
   When the stored list is empty it is fetched with get_systems first; the
   list that was searched is what ends up stored. *)
fun get_system prefix = Synchronized.change_result systems (fn systems =>
  (if null systems then get_systems () else systems)
  |> `(find_first (String.isPrefix prefix)));
32864
a226f29d4bdc
reorganized signature of AtpWrapper structure: records instead of unnamed parameters and return values,
boehmes
parents:
32740
diff
changeset

606 

32948  607 
(* Like get_system, but raises an error instead of returning NONE when no
   system name starts with "prefix". *)
fun the_system prefix =
  (case get_system prefix of
    NONE => error ("System " ^ quote prefix ^ " not available at SystemOnTPTP.")
  | SOME sys => sys);
31835  611 

36265
41c9e755e552
distinguish between the different ATP errors in the user interface;
blanchet
parents:
36264
diff
changeset

612 
(* Output fragments, paired with the failure they indicate, that are put in
   front of a prover's own known failures by remote_config. *)
val remote_known_failures =
  (CantConnect, "HTTPError")
  :: (TimedOut, "says Timeout")
  :: [(MalformedOutput, "Remote script could not extract proof")]
35865  616 

37509
f39464d971c4
factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents:
37506
diff
changeset

617 
(* Derives the configuration of a remote prover from that of a local one.
   The executable becomes the SystemOnTPTP script; proof delimiters and known
   failures are extended, and the remaining fields are copied unchanged.

   atp_prefix: prefix used to pick the system name via the_system
   args:       extra arguments placed before the "-t" and "-s" options *)
fun remote_config atp_prefix args
        ({proof_delims, known_failures, max_new_relevant_facts_per_iter,
          prefers_theory_relevant, explicit_forall, ...} : prover_config)
        : prover_config =
  {home_var = "ISABELLE_ATP_MANAGER",
   executable = "SystemOnTPTP",
   (* The system name is resolved each time the argument string is built. *)
   arguments = fn _ => fn timeout =>
     args ^ " -t " ^ string_of_int (to_generous_secs timeout) ^ " -s " ^
     the_system atp_prefix,
   (* "insert" adds the TSTP delimiters only if they are not already there. *)
   proof_delims = insert (op =) tstp_proof_delims proof_delims,
   known_failures = remote_known_failures @ known_failures,
   max_new_relevant_facts_per_iter = max_new_relevant_facts_per_iter,
   prefers_theory_relevant = prefers_theory_relevant,
   explicit_forall = explicit_forall}
28596
fcd463a6b6de
tuned interfaces  plain prover function, without thread;
wenzelm
parents:
28592
diff
changeset

631 

37509
f39464d971c4
factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents:
37506
diff
changeset

632 
(* Builds the remote counterpart of a local prover entry: the local name is
   passed through remotify and the configuration through remote_config. *)
fun remote_tptp_prover prover atp_prefix args config =
  let
    val remote_name = remotify (fst prover)
    val remote_cfg = remote_config atp_prefix args config
  in tptp_prover remote_name remote_cfg end
32864
a226f29d4bdc
reorganized signature of AtpWrapper structure: records instead of unnamed parameters and return values,
boehmes
parents:
32740
diff
changeset

634 

37509
f39464d971c4
factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents:
37506
diff
changeset

635 
(* Remote counterparts of the three local provers. The second argument is the
   system-name prefix and the third holds extra script arguments; only SPASS
   passes one ("-x"). *)
val remote_e = remote_tptp_prover e "EP" "" e_config
val remote_spass = remote_tptp_prover spass "SPASS" "-x" spass_config
val remote_vampire = remote_tptp_prover vampire "Vampire9" "" vampire_config
28592  638 

36917
8674cdb0b8cc
query _HOME environment variables at runtime, not at buildtime
blanchet
parents:
36910
diff
changeset

639 
(* Returns the prover's name, passed through remotify when the environment
   variable named by the configuration's home_var is empty. *)
fun maybe_remote (name, _) ({home_var, ...} : prover_config) =
  name |> getenv home_var = "" ? remotify
36371
8c83ea1a7740
move the Sledgehammer menu options to "sledgehammer_isar.ML"
blanchet
parents:
36370
diff
changeset

641 

8c83ea1a7740
move the Sledgehammer menu options to "sledgehammer_isar.ML"
blanchet
parents:
36370
diff
changeset

642 
(* Space-separated default prover names: E and SPASS go through maybe_remote,
   while Vampire's name is always passed through remotify. *)
fun default_atps_param_value () =
  let
    val names =
      [maybe_remote e e_config, maybe_remote spass spass_config,
       remotify (fst vampire)]
  in space_implode " " names end
8c83ea1a7740
move the Sledgehammer menu options to "sledgehammer_isar.ML"
blanchet
parents:
36370
diff
changeset

645 

37509
f39464d971c4
factor out TPTP format output into file of its own, to facilitate further changes
blanchet
parents:
37506
diff
changeset

646 
(* All prover entries defined above: the local ones, then the remote ones. *)
val provers =
  [e, spass, vampire] @ [remote_e, remote_spass, remote_vampire]

(* Folds add_prover over the list of prover entries. *)
val prover_setup = fold add_prover provers
648 

649 
(* Applies the three configuration-option setups and then the prover setup,
   in that order. *)
val setup =
  fn thy =>
    thy
    |> dest_dir_setup
    |> problem_prefix_setup
    |> measure_runtime_setup
    |> prover_setup
35867  654 

28592  655 
end; 