author  blanchet 
Wed, 28 Jul 2010 18:32:54 +0200  
(*  Title:      HOL/Tools/ATP_Manager/atp_systems.ML
    Author:     Fabian Immler, TU Muenchen
    Author:     Jasmin Blanchette, TU Muenchen

Setup for supported ATPs.
*)
7 

36376  8 
(* Public interface of the ATP setup module: failure categories, the prover
   configuration record, and the registry/lookup operations on theories. *)
signature ATP_SYSTEMS =
sig
  datatype failure =
    Unprovable | IncompleteUnprovable | CantConnect | TimedOut |
    OutOfResources | OldSpass | MalformedInput | MalformedOutput | UnknownError

  type prover_config =
    {executable: string * string,
     required_executables: (string * string) list,
     arguments: bool -> Time.time -> string,
     proof_delims: (string * string) list,
     known_failures: (failure * string) list,
     max_new_relevant_facts_per_iter: int,
     prefers_theory_relevant: bool,
     explicit_forall: bool}

  val add_prover: string * prover_config -> theory -> theory
  val get_prover: theory -> string -> prover_config
  val available_atps: theory -> unit
  val refresh_systems_on_tptp : unit -> unit
  val default_atps_param_value : unit -> string
  val setup : theory -> theory
end;
31 

36376  32 
structure ATP_Systems : ATP_SYSTEMS = 
28592  33 
struct 
34 

38023  35 
(* prover configuration *) 
36 

38023  37 
(* Failure categories; the prover configurations in this file pair them with
   characteristic output strings in their "known_failures" lists. *)
datatype failure =
  Unprovable | IncompleteUnprovable | CantConnect | TimedOut | OutOfResources |
  OldSpass | MalformedInput | MalformedOutput | UnknownError

40 

41 
(* Configuration record describing one prover.

   executable: pair whose first component is looked up with "getenv" by
     "is_installed" (i.e. an environment variable name); the second component
     is presumably the program path relative to it -- confirm against callers.
   required_executables: further pairs of the same shape that must also be
     available.
   arguments: builds the command-line argument string from a boolean (named
     "complete" in the SPASS setup) and a timeout.
   proof_delims: (start, end) marker pairs.
   known_failures: failure categories paired with output strings. *)
type prover_config =
  {executable: string * string,
   required_executables: (string * string) list,
   arguments: bool -> Time.time -> string,
   proof_delims: (string * string) list,
   known_failures: (failure * string) list,
   max_new_relevant_facts_per_iter: int,
   prefers_theory_relevant: bool,
   explicit_forall: bool}
50 

fcd463a6b6de
tuned interfaces  plain prover function, without thread;
wenzelm
parents:
28592
diff
changeset

51 

38023  52 
(* named provers *) 
53 

38023  54 
(* Theory data holding the registered provers: a symbol table from prover name
   to its configuration paired with a stamp.  Merging compares entries via
   "eq_snd op =" and reports a name clash as a "Duplicate ATP" error. *)
structure Data = Theory_Data
(
  type T = (prover_config * stamp) Symtab.table
  val empty = Symtab.empty
  val extend = I
  fun merge data : T = Symtab.merge (eq_snd op =) data
    handle Symtab.DUP name => error ("Duplicate ATP: " ^ quote name ^ ".")
)

62 

38023  63 
(* Registers "config" under "name" in the theory data, tagging it with a fresh
   stamp.  Raises an error if a prover with that name is already present. *)
fun add_prover (name, config) thy =
  Data.map (Symtab.update_new (name, (config, stamp ()))) thy
  handle Symtab.DUP name => error ("Duplicate ATP: " ^ quote name ^ ".")

66 

38023  67 
(* Looks up the configuration registered under "name" (dropping its stamp).
   Raises an "Unknown ATP" error if no such prover is registered. *)
fun get_prover thy name =
  the (Symtab.lookup (Data.get thy) name) |> fst
  handle Option.Option => error ("Unknown ATP: " ^ name ^ ".")

70 

38023  71 
(* Emits, via "priority", the sorted comma-separated names of all provers
   registered in the theory.  (The verbatim duplicate definition that followed
   has been removed.) *)
fun available_atps thy =
  priority ("Available ATPs: " ^
            commas (sort_strings (Symtab.keys (Data.get thy))) ^ ".")

78 

36382  79 
(* Converts a time span to whole seconds, rounding a fractional second up. *)
fun to_generous_secs time =
  let
    val millis = Time.toMilliseconds time
  in
    (millis + 999) div 1000
  end
80 

81 
(* E prover *) 
82 

83 
(* (start, end) marker pair used as E's proof delimiters; also added to the
   delimiters of every remote prover configuration. *)
val tstp_proof_delims =
  ("# SZS output start CNFRefutation.", "# SZS output end CNFRefutation")
85 

35969  86 
(* Configuration for a locally installed E prover, found through "E_HOME".
   The timeout is passed in whole seconds, rounded up.
   NOTE(review): the leading dashes of the command-line options were lost in
   extraction and have been reconstructed -- confirm against the repository. *)
val e_config : prover_config =
  {executable = ("E_HOME", "eproof"),
   required_executables = [],
   arguments = fn _ => fn timeout =>
     "--tstp-in --tstp-out -l5 -xAutoDev -tAutoDev --silent --cpu-limit=" ^
     string_of_int (to_generous_secs timeout),
   proof_delims = [tstp_proof_delims],
   known_failures =
     [(Unprovable, "SZS status: CounterSatisfiable"),
      (Unprovable, "SZS status CounterSatisfiable"),
      (TimedOut, "Failure: Resource limit exceeded (time)"),
      (TimedOut, "time limit exceeded"),
      (OutOfResources,
       "# Cannot determine problem status within resource limit"),
      (OutOfResources, "SZS status: ResourceOut"),
      (OutOfResources, "SZS status ResourceOut")],
   max_new_relevant_facts_per_iter = 80 (* FIXME *),
   prefers_theory_relevant = false,
   explicit_forall = false}

(* Named prover entry for E. *)
val e = ("e", e_config)
106 

107 

108 
(* Configuration for SPASS, run through the wrapper script under
   "ISABELLE_ATP_MANAGER"; it additionally requires "SPASS_HOME" to be set.

   The "VarWeight=3" option helps the higher-order problems, probably by
   counteracting the presence of "hAPP".

   NOTE(review): the leading dashes of the command-line options and the "|>"
   operator were lost in extraction and have been reconstructed -- confirm
   against the repository. *)
val spass_config : prover_config =
  {executable = ("ISABELLE_ATP_MANAGER", "scripts/spass"),
   required_executables = [("SPASS_HOME", "SPASS")],
   (* "div 2" accounts for the fact that SPASS is often run twice. *)
   arguments = fn complete => fn timeout =>
     ("-Auto -PGiven=0 -PProblem=0 -Splits=0 -FullRed=0 -DocProof \
      \-VarWeight=3 -TimeLimit=" ^
      string_of_int (to_generous_secs timeout div 2))
     |> not complete ? prefix "-SOS=1 ",
   proof_delims = [("Here is a proof", "Formulae used in the proof")],
   known_failures =
     [(IncompleteUnprovable, "SPASS beiseite: Completion found"),
      (TimedOut, "SPASS beiseite: Ran out of time"),
      (OutOfResources, "SPASS beiseite: Maximal number of loops exceeded"),
      (MalformedInput, "Undefined symbol"),
      (MalformedInput, "Free Variable"),
      (OldSpass, "tptp2dfg")],
   max_new_relevant_facts_per_iter = 26 (* FIXME *),
   prefers_theory_relevant = true,
   explicit_forall = true}

(* Named prover entry for SPASS. *)
val spass = ("spass", spass_config)
131 

132 
(* Vampire *) 
133 

134 
(* Configuration for a locally installed Vampire, found through
   "VAMPIRE_HOME".  Three alternative pairs of proof delimiters are accepted.
   NOTE(review): the leading dashes of the command-line options were lost in
   extraction and have been reconstructed -- confirm against the repository. *)
val vampire_config : prover_config =
  {executable = ("VAMPIRE_HOME", "vampire"),
   required_executables = [],
   arguments = fn _ => fn timeout =>
     "--mode casc -t " ^ string_of_int (to_generous_secs timeout) ^
     " --input_file ",
   proof_delims =
     [("=========== Refutation ==========",
       "======= End of refutation ======="),
      ("% SZS output start Refutation", "% SZS output end Refutation"),
      ("% SZS output start Proof", "% SZS output end Proof")],
   known_failures =
     [(Unprovable, "UNPROVABLE"),
      (IncompleteUnprovable, "CANNOT PROVE"),
      (Unprovable, "Satisfiability detected"),
      (OutOfResources, "Refutation not found")],
   max_new_relevant_facts_per_iter = 40 (* FIXME *),
   prefers_theory_relevant = false,
   explicit_forall = false}

(* Named prover entry for Vampire. *)
val vampire = ("vampire", vampire_config)
154 

155 
(* Remote prover invocation via SystemOnTPTP *) 
156 

38023  157 
(* Synchronized variable caching the list of system names obtained from
   SystemOnTPTP; it starts out empty. *)
val systems =
  Synchronized.var "atp_systems" ([] : string list)
31835  158 

159 
(* Runs the "remote_atp" script and returns its output split into lines when
   the exit code is 0; otherwise raises an error carrying the script output
   (with one trailing newline removed, if present).
   NOTE(review): the "-w" flag's dash was lost in extraction and has been
   reconstructed -- confirm against the script. *)
fun get_systems () =
  case bash_output "\"$ISABELLE_ATP_MANAGER/scripts/remote_atp\" -w" of
    (answer, 0) => split_lines answer
  | (answer, _) =>
    error ("Failed to get available systems at SystemOnTPTP:\n" ^
           perhaps (try (unsuffix "\n")) answer)

31835  165 

35867  166 
(* Unconditionally replaces the cached system list with a freshly fetched one.
   The function header was lost in extraction; it is reconstructed from the
   signature entry "refresh_systems_on_tptp : unit -> unit". *)
fun refresh_systems_on_tptp () =
  Synchronized.change systems (fn _ => get_systems ())
31835  168 

169 
(* Returns the first cached system name starting with "prefix", if any.  When
   the cache is empty the system list is fetched first, and the list used for
   the search is stored back into the cache. *)
fun get_system prefix = Synchronized.change_result systems (fn systems =>
  (if null systems then get_systems () else systems)
  |> `(find_first (String.isPrefix prefix)));
172 

32948  173 
(* Like "get_system", but raises an error instead of returning NONE when no
   system name starts with "prefix". *)
fun the_system prefix =
  (case get_system prefix of
    NONE => error ("System " ^ quote prefix ^ " not available at SystemOnTPTP.")
  | SOME sys => sys);
31835  177 

36265
41c9e755e552
distinguish between the different ATP errors in the user interface;
blanchet
parents:
36264
diff
changeset

178 
(* Failure patterns specific to remote invocation; "remote_config" prepends
   them to the known failures of the underlying prover. *)
val remote_known_failures =
  [(CantConnect, "HTTPError"),
   (TimedOut, "says Timeout"),
   (MalformedOutput, "Remote script could not extract proof")]
35865  182 

38041
3b80d6082131
remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents:
38033
diff
changeset

183 
(* Derives a remote configuration from a local one.  The executable becomes
   the "remote_atp" script, the arguments pass the timeout (whole seconds,
   rounded up) and the system name resolved from "atp_prefix" via
   "the_system", the TSTP delimiters and the remote failure patterns are
   added, and the remaining fields are copied unchanged.
   NOTE(review): the dashes of the "-t"/"-s" flags were lost in extraction and
   have been reconstructed -- confirm against the script. *)
fun remote_config atp_prefix
        ({proof_delims, known_failures, max_new_relevant_facts_per_iter,
          prefers_theory_relevant, explicit_forall, ...} : prover_config)
        : prover_config =
  {executable = ("ISABELLE_ATP_MANAGER", "scripts/remote_atp"),
   required_executables = [],
   arguments = fn _ => fn timeout =>
     " -t " ^ string_of_int (to_generous_secs timeout) ^ " -s " ^
     the_system atp_prefix,
   proof_delims = insert (op =) tstp_proof_delims proof_delims,
   known_failures = remote_known_failures @ known_failures,
   max_new_relevant_facts_per_iter = max_new_relevant_facts_per_iter,
   prefers_theory_relevant = prefers_theory_relevant,
   explicit_forall = explicit_forall}
28596
fcd463a6b6de
tuned interfaces  plain prover function, without thread;
wenzelm
parents:
28592
diff
changeset

197 

38023  198 
(* Name under which the remote variant of a prover is registered. *)
fun remote_name name = prefix "remote_" name
32864
a226f29d4bdc
reorganized signature of AtpWrapper structure: records instead of unnamed parameters and return values,
boehmes
parents:
32740
diff
changeset

199 

38041
3b80d6082131
remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents:
38033
diff
changeset

200 
(* Builds the named remote variant of a local prover entry; "atp_prefix" is
   the prefix used to select the system at SystemOnTPTP. *)
fun remote_prover (name, config) atp_prefix =
  (remote_name name, remote_config atp_prefix config)
38023  202 

38041
3b80d6082131
remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents:
38033
diff
changeset

203 
(* Remote variants of E and Vampire, selected by system-name prefix. *)
val remote_e = remote_prover e "EP"
val remote_vampire = remote_prover vampire "Vampire9"
28592  205 

38041
3b80d6082131
remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents:
38033
diff
changeset

206 
(* A prover counts as installed when the environment variable named by the
   first component of its executable, and of every required executable, is
   non-empty. *)
fun is_installed ({executable, required_executables, ...} : prover_config) =
  forall (curry (op <>) "" o getenv o fst) (executable :: required_executables)
3b80d6082131
remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents:
38033
diff
changeset

208 
(* Returns the prover's name, or its remote name when the prover is not
   installed locally. *)
fun maybe_remote (name, config) =
  name |> not (is_installed config) ? remote_name
36371
8c83ea1a7740
move the Sledgehammer menu options to "sledgehammer_isar.ML"
blanchet
parents:
36370
diff
changeset

210 

8c83ea1a7740
move the Sledgehammer menu options to "sledgehammer_isar.ML"
blanchet
parents:
36370
diff
changeset

211 
(* Space-separated default prover list: E (remote if not installed locally),
   SPASS only if installed locally, and always the remote Vampire. *)
fun default_atps_param_value () =
  space_implode " " ([maybe_remote e] @
                     (if is_installed (snd spass) then [fst spass] else []) @
                     [remote_name (fst vampire)])
36371
8c83ea1a7740
move the Sledgehammer menu options to "sledgehammer_isar.ML"
blanchet
parents:
36370
diff
changeset

215 

38041
3b80d6082131
remove "remote_spass" because there's no way to find out which clauses come from which facts + rename scripts
blanchet
parents:
38033
diff
changeset

216 
(* All built-in prover entries, and the theory setup that registers each of
   them with "add_prover". *)
val provers = [e, spass, vampire, remote_e, remote_vampire]
val setup = fold add_prover provers
35867  218 

28592  219 
end; 