author | blanchet |
Tue, 19 Feb 2013 15:37:42 +0100 | |
changeset 51186 | c8721406511a |
parent 51181 | d0fa18638478 |
child 51190 | 2654b3965c8d |
permissions | -rw-r--r-- |
41087
d7b5fd465198
split "Sledgehammer" module into two parts, to resolve forthcoming dependency problems
blanchet
parents:
41066
diff
changeset
|
1 |
(* Title: HOL/Tools/Sledgehammer/sledgehammer_provers.ML |
28477
9339d4dcec8b
version of sledgehammer using threads instead of processes, misc cleanup;
wenzelm
parents:
diff
changeset
|
2 |
Author: Fabian Immler, TU Muenchen |
32996
d2e48879e65a
removed disjunctive group cancellation -- provers run independently;
wenzelm
parents:
32995
diff
changeset
|
3 |
Author: Makarius |
35969 | 4 |
Author: Jasmin Blanchette, TU Muenchen |
28477
9339d4dcec8b
version of sledgehammer using threads instead of processes, misc cleanup;
wenzelm
parents:
diff
changeset
|
5 |
|
41087
d7b5fd465198
split "Sledgehammer" module into two parts, to resolve forthcoming dependency problems
blanchet
parents:
41066
diff
changeset
|
6 |
Generic prover abstraction for Sledgehammer. |
28477
9339d4dcec8b
version of sledgehammer using threads instead of processes, misc cleanup;
wenzelm
parents:
diff
changeset
|
7 |
*) |
9339d4dcec8b
version of sledgehammer using threads instead of processes, misc cleanup;
wenzelm
parents:
diff
changeset
|
8 |
|
41087
d7b5fd465198
split "Sledgehammer" module into two parts, to resolve forthcoming dependency problems
blanchet
parents:
41066
diff
changeset
|
9 |
signature SLEDGEHAMMER_PROVERS =
sig
  (* Type abbreviations re-exported from other structures. *)
  type failure = ATP_Proof.failure
  type stature = ATP_Problem_Generate.stature
  type type_enc = ATP_Problem_Generate.type_enc
  type fact = Sledgehammer_Fact.fact
  type reconstructor = Sledgehammer_Reconstruct.reconstructor
  type play = Sledgehammer_Reconstruct.play
  type minimize_command = Sledgehammer_Reconstruct.minimize_command

  (* Mode in which a prover is obtained (see "get_prover"). *)
  datatype mode = Auto_Try | Try | Normal | MaSh | Auto_Minimize | Minimize

  (* Options passed to a prover as a single record. *)
  type params =
    {debug : bool,
     verbose : bool,
     overlord : bool,
     blocking : bool,
     provers : string list,
     type_enc : string option,
     strict : bool,
     lam_trans : string option,
     uncurried_aliases : bool option,
     learn : bool,
     fact_filter : string option,
     max_facts : int option,
     fact_thresholds : real * real,
     max_mono_iters : int option,
     max_new_mono_instances : int option,
     isar_proofs : bool,
     isar_compress : real,
     slice : bool,
     minimize : bool option,
     timeout : Time.time option,
     preplay_timeout : Time.time option,
     expect : string}

  (* Numeric tuning constants; presumably consumed by the relevance filter
     (not visible in this signature -- confirm at the use sites). *)
  type relevance_fudge =
    {local_const_multiplier : real,
     worse_irrel_freq : real,
     higher_order_irrel_weight : real,
     abs_rel_weight : real,
     abs_irrel_weight : real,
     skolem_irrel_weight : real,
     theory_const_rel_weight : real,
     theory_const_irrel_weight : real,
     chained_const_irrel_weight : real,
     intro_bonus : real,
     elim_bonus : real,
     simp_bonus : real,
     local_bonus : real,
     assum_bonus : real,
     chained_bonus : real,
     max_imperfect : real,
     max_imperfect_exp : real,
     threshold_divisor : real,
     ridiculous_threshold : real}

  (* Input handed to a prover. *)
  type prover_problem =
    {state : Proof.state,
     goal : thm,
     subgoal : int,
     subgoal_count : int,
     factss : (string * fact list) list}

  (* Output produced by a prover. *)
  type prover_result =
    {outcome : failure option,
     used_facts : (string * stature) list,
     used_from : fact list,
     run_time : Time.time,
     preplay : play Lazy.lazy,
     message : play -> string,
     message_tail : string}

  (* A prover maps parameters, a minimize-command builder and a problem to a
     result. *)
  type prover =
    params -> ((string * string list) list -> string -> minimize_command)
    -> prover_problem -> prover_result

  (* Configuration options, plus one unsynchronized reference. *)
  val dest_dir : string Config.T
  val problem_prefix : string Config.T
  val completish : bool Config.T
  val atp_full_names : bool Config.T
  val smt_triggers : bool Config.T
  val smt_weights : bool Config.T
  val smt_weight_min_facts : int Config.T
  val smt_min_weight : int Config.T
  val smt_max_weight : int Config.T
  val smt_max_weight_index : int Config.T
  val smt_weight_curve : (int -> int) Unsynchronized.ref
  val smt_max_slices : int Config.T
  val smt_slice_fact_frac : real Config.T
  val smt_slice_time_frac : real Config.T
  val smt_slice_min_secs : int Config.T

  val SledgehammerN : string
  val plain_metis : reconstructor
  val select_smt_solver : string -> Proof.context -> Proof.context
  val extract_reconstructor :
    params -> reconstructor -> string * (string * string list) list

  (* Predicates on prover names. *)
  val is_reconstructor : string -> bool
  val is_atp : theory -> string -> bool
  val is_smt_prover : Proof.context -> string -> bool
  val is_ho_atp : Proof.context -> string -> bool
  val is_unit_equational_atp : Proof.context -> string -> bool
  val is_prover_supported : Proof.context -> string -> bool
  val is_prover_installed : Proof.context -> string -> bool

  val default_max_facts_for_prover : Proof.context -> bool -> string -> int
  val is_unit_equality : term -> bool
  val is_appropriate_prop_for_prover : Proof.context -> string -> term -> bool
  val is_built_in_const_for_prover :
    Proof.context -> string -> string * typ -> term list -> bool * term list

  val atp_relevance_fudge : relevance_fudge
  val smt_relevance_fudge : relevance_fudge
  val relevance_fudge_for_prover : Proof.context -> string -> relevance_fudge
  val weight_smt_fact :
    Proof.context -> int -> ((string * stature) * thm) * int
    -> (string * stature) * (int option * thm)

  val supported_provers : Proof.context -> unit
  val kill_provers : unit -> unit
  val running_provers : unit -> unit
  val messages : int option -> unit

  val is_fact_chained : (('a * stature) * 'b) -> bool
  val filter_used_facts :
    bool -> (''a * stature) list -> ((''a * stature) * 'b) list ->
    ((''a * stature) * 'b) list
  val get_prover : Proof.context -> mode -> string -> prover
end;
9339d4dcec8b
version of sledgehammer using threads instead of processes, misc cleanup;
wenzelm
parents:
diff
changeset
|
134 |
|
41087
d7b5fd465198
split "Sledgehammer" module into two parts, to resolve forthcoming dependency problems
blanchet
parents:
41066
diff
changeset
|
135 |
structure Sledgehammer_Provers : SLEDGEHAMMER_PROVERS = |
28477
9339d4dcec8b
version of sledgehammer using threads instead of processes, misc cleanup;
wenzelm
parents:
diff
changeset
|
136 |
struct |
9339d4dcec8b
version of sledgehammer using threads instead of processes, misc cleanup;
wenzelm
parents:
diff
changeset
|
137 |
|
43085
0a2f5b86bdd7
first step in sharing more code between ATP and Metis translation
blanchet
parents:
43063
diff
changeset
|
138 |
open ATP_Util |
38028 | 139 |
open ATP_Problem |
39491
2416666e6f94
refactoring: move ATP proof and error extraction code to "ATP_Proof" module
blanchet
parents:
39453
diff
changeset
|
140 |
open ATP_Proof |
38028 | 141 |
open ATP_Systems |
46320 | 142 |
open ATP_Problem_Generate |
143 |
open ATP_Proof_Reconstruct |
|
45521 | 144 |
open Metis_Tactic |
38023 | 145 |
open Sledgehammer_Util |
51005
ce4290c33d73
eliminated needless speed optimization -- and simplified code quite a bit
blanchet
parents:
50927
diff
changeset
|
146 |
open Sledgehammer_Fact |
49881
d9d73ebf9274
added proof minimization code from Steffen Smolka
blanchet
parents:
48802
diff
changeset
|
147 |
open Sledgehammer_Reconstruct |
48288
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
148 |
|
37583
9ce2451647d5
factored non-ATP specific code from "ATP_Manager" out, so that it can be reused for the LEO-II integration
blanchet
parents:
37581
diff
changeset
|
149 |
|
9ce2451647d5
factored non-ATP specific code from "ATP_Manager" out, so that it can be reused for the LEO-II integration
blanchet
parents:
37581
diff
changeset
|
150 |
(** The Sledgehammer **) |
9ce2451647d5
factored non-ATP specific code from "ATP_Manager" out, so that it can be reused for the LEO-II integration
blanchet
parents:
37581
diff
changeset
|
151 |
|
48392
ca998fa08cd9
added "learn_from_atp" command to MaSh, for patient users
blanchet
parents:
48376
diff
changeset
|
152 |
(* Must list the same constructors as the "mode" datatype specified in the
   signature. *)
datatype mode =
  Auto_Try | Try | Normal | MaSh | Auto_Minimize | Minimize
43021 | 153 |
|
45376 | 154 |
(* Name by which Sledgehammer is told apart from the other tools that could
   use "Async_Manager". *)
val SledgehammerN : string = "Sledgehammer"
37585 | 157 |
|
45520 | 158 |
(* Names accepted by "is_reconstructor". *)
val reconstructor_names = [metisN, smtN]

(* Metis reconstructor built from the head of "partial_type_encs" and
   "combsN". *)
val plain_metis =
  let val first_enc = hd partial_type_encs in
    Metis (first_enc, combsN)
  end

(* True iff "name" occurs in "reconstructor_names". *)
fun is_reconstructor name = member (op =) reconstructor_names name
43228
2ed2f092e990
obsoleted "metisFT", and added "no_types" version of Metis as fallback to Sledgehammer after noticing how useful it can be
blanchet
parents:
43226
diff
changeset
|
161 |
|
43050
59284a13abc4
support "metis" and "metisFT" as provers in the architecture, so they can be used for minimizing
blanchet
parents:
43044
diff
changeset
|
162 |
(* Membership test against "supported_atps thy".  The list is computed as soon
   as the theory argument is supplied, so a partial application "is_atp thy"
   can be reused for several names. *)
fun is_atp thy = member (op =) (supported_atps thy)
59284a13abc4
support "metis" and "metisFT" as provers in the architecture, so they can be used for minimizing
blanchet
parents:
43044
diff
changeset
|
163 |
|
43233
2749c357f865
use the proper prover name, e.g. metis_full_types, not metis (full_types), for minimizing
blanchet
parents:
43232
diff
changeset
|
164 |
(* Lifts "SMT_Config.select_solver name" to proof contexts via
   "Context.proof_map". *)
fun select_smt_solver name = Context.proof_map (SMT_Config.select_solver name)
41242
8edeb1dbbc76
run the SMT relevance filter only once, then run the normalization/monomorphization code once _per class_ of SMT solvers
blanchet
parents:
41241
diff
changeset
|
165 |
|
45376 | 166 |
(* Membership test against the solvers reported by
   "SMT_Solver.available_solvers_of" for the given context. *)
fun is_smt_prover ctxt =
  let val solvers = SMT_Solver.available_solvers_of ctxt in
    member (op =) solvers
  end
40062 | 167 |
|
44597 | 168 |
(* True iff "name" can be looked up with "get_atp" and at least one of that
   ATP's best slices has a format satisfying "is_format".  A failing lookup
   (caught by "try") yields false. *)
fun is_atp_for_format is_format ctxt name =
  let
    val thy = Proof_Context.theory_of ctxt
    (* the format is the second component of the slice's inner 5-tuple *)
    fun slice_has_format (_, ((_, format, _, _, _), _)) = is_format format
  in
    (case try (get_atp thy) name of
      NONE => false
    | SOME config => exists slice_has_format (#best_slices (config ()) ctxt))
  end
9e620869a576
improved Waldmeister support -- even run it by default on unit equational goals
blanchet
parents:
42943
diff
changeset
|
176 |
|
44597 | 177 |
(* True iff the named ATP has a best slice whose format equals CNF_UEQ. *)
fun is_unit_equational_atp ctxt name =
  is_atp_for_format (fn format => CNF_UEQ = format) ctxt name
45303
bd03b08161ac
added DFG unsorted support (like in the old days)
blanchet
parents:
45301
diff
changeset
|
178 |
(* True iff the named ATP has a best slice whose format satisfies
   "is_format_higher_order". *)
fun is_ho_atp ctxt name = is_atp_for_format is_format_higher_order ctxt name
44597 | 179 |
|
45376 | 180 |
(* A name is supported if it is a reconstructor, an ATP of the context's
   theory, or an SMT prover of the context.  The ATP and SMT predicates are
   built once, when "ctxt" is supplied, and shared by all later name tests. *)
fun is_prover_supported ctxt =
  let
    val atp_known = is_atp (Proof_Context.theory_of ctxt)
    val smt_known = is_smt_prover ctxt
  in
    fn name =>
      is_reconstructor name orelse atp_known name orelse smt_known name
  end
40072
27f2a45b0aab
more robust handling of "remote_" vs. non-"remote_" provers
blanchet
parents:
40071
diff
changeset
|
184 |
|
41432
3214c39777ab
differentiate between local and remote SMT solvers (e.g., "z3" vs. "remote_z3");
boehmes
parents:
41336
diff
changeset
|
185 |
(* A name counts as installed if it is a reconstructor, an SMT prover of the
   context, or accepted by "is_atp_installed" for the context's theory.  The
   SMT and ATP predicates are built once, when "ctxt" is supplied. *)
fun is_prover_installed ctxt =
  let
    val smt_installed = is_smt_prover ctxt
    val atp_installed = is_atp_installed (Proof_Context.theory_of ctxt)
  in
    fn name =>
      is_reconstructor name orelse smt_installed name orelse
      atp_installed name
  end
40941
a3e6f8634a11
replace "smt" prover with specific SMT solvers, e.g. "z3" -- whatever the SMT module gives us
blanchet
parents:
40723
diff
changeset
|
188 |
|
45706 | 189 |
(* Pairs every slice with its 0-based position.  When "slice" is false only
   the last indexed slice is kept, as a singleton list; in that case an empty
   "slices" makes "List.last" raise Empty. *)
fun get_slices slice slices =
  let
    val positions = 0 upto length slices - 1
    val indexed = positions ~~ slices
  in
    if slice then indexed else [List.last indexed]
  end
|
42443
724e612ba248
implemented general slicing for ATPs, especially E 1.2w and above
blanchet
parents:
42361
diff
changeset
|
191 |
|
48293 | 192 |
(* Value returned by "default_max_facts_for_prover" for reconstructors. *)
val reconstructor_default_max_facts : int = 20
43050
59284a13abc4
support "metis" and "metisFT" as provers in the architecture, so they can be used for minimizing
blanchet
parents:
43044
diff
changeset
|
193 |
|
51186
c8721406511a
interpret "max_facts" argument in a slice-dependent fashion, instead of forcing the same number of facts to all slices
blanchet
parents:
51181
diff
changeset
|
194 |
(* Projects the "max_facts" component out of an indexed slice, as produced by
   "get_slices". *)
fun slice_max_facts (_, (_, (spec, _))) =
  let val ((max_facts, _), _, _, _, _) = spec in
    max_facts
  end
c8721406511a
interpret "max_facts" argument in a slice-dependent fashion, instead of forcing the same number of facts to all slices
blanchet
parents:
51181
diff
changeset
|
195 |
|
48293 | 196 |
(* Default number of facts for the named prover:
     - reconstructors: "reconstructor_default_max_facts";
     - ATPs: the largest "max_facts" among the slices selected by
       "get_slices slice" (0 if no slice contributes a larger value);
     - anything else is treated as an SMT prover and delegated to
       "SMT_Solver.default_max_relevant". *)
fun default_max_facts_for_prover ctxt slice name =
  let
    val thy = Proof_Context.theory_of ctxt
    fun max_over_slices () =
      let
        val {best_slices, ...} = get_atp thy name ()
        val slices = get_slices slice (best_slices ctxt)
      in
        fold (fn s => fn acc => Integer.max (slice_max_facts s) acc) slices 0
      end
  in
    if is_reconstructor name then reconstructor_default_max_facts
    else if is_atp thy name then max_over_slices ()
    else (* is_smt_prover ctxt name *) SMT_Solver.default_max_relevant ctxt name
  end
40063
d086e3699e78
bring ATPs and SMT solvers more in line with each other
blanchet
parents:
40062
diff
changeset
|
206 |
|
42956
9aeb0f6ad971
filter Waldmeister facts better -- and don't encode type classes as predicates, since it doesn't like conditional equations
blanchet
parents:
42952
diff
changeset
|
207 |
(* True iff the first component of the pair is the name of the "If"
   constant. *)
fun is_if (const_name, _) = (const_name = @{const_name If})
9aeb0f6ad971
filter Waldmeister facts better -- and don't encode type classes as predicates, since it doesn't like conditional equations
blanchet
parents:
42952
diff
changeset
|
209 |
|
9aeb0f6ad971
filter Waldmeister facts better -- and don't encode type classes as predicates, since it doesn't like conditional equations
blanchet
parents:
42952
diff
changeset
|
210 |
(* Beware of "if and only if" (which is translated as such) and "If" (which is
   translated to conditional equations): equations at type bool are rejected,
   and so is any equation with an "If" constant on either side. *)
fun is_good_unit_equality T t u =
  if T = @{typ bool} then false
  else not (exists_Const is_if t) andalso not (exists_Const is_if u)
9aeb0f6ad971
filter Waldmeister facts better -- and don't encode type classes as predicates, since it doesn't like conditional equations
blanchet
parents:
42952
diff
changeset
|
214 |
|
42944
9e620869a576
improved Waldmeister support -- even run it by default on unit equational goals
blanchet
parents:
42943
diff
changeset
|
215 |
(* Recognizes terms that, after stripping "Trueprop" and leading "all"/"All"
   quantifiers, are a "==" or "HOL.eq" equation accepted by
   "is_good_unit_equality".  Any other term shape yields false. *)
fun is_unit_equality t =
  (case t of
    @{const Trueprop} $ body => is_unit_equality body
  | Const (@{const_name all}, _) $ Abs (_, _, body) => is_unit_equality body
  | Const (@{const_name All}, _) $ Abs (_, _, body) => is_unit_equality body
  | Const (@{const_name "=="}, Type (_, [T, _])) $ lhs $ rhs =>
    is_good_unit_equality T lhs rhs
  | Const (@{const_name HOL.eq}, Type (_, [T, _])) $ lhs $ rhs =>
    is_good_unit_equality T lhs rhs
  | _ => false)
9e620869a576
improved Waldmeister support -- even run it by default on unit equational goals
blanchet
parents:
42943
diff
changeset
|
225 |
|
42952
96f62b77748f
tuning -- the "appropriate" terminology is inspired from TPTP
blanchet
parents:
42944
diff
changeset
|
226 |
(* Chooses the proposition filter for the named prover: unit-equational ATPs
   accept only unit equalities, every other prover accepts any term.  The
   choice is made once "ctxt" and "name" are supplied. *)
fun is_appropriate_prop_for_prover ctxt name =
  (case is_unit_equational_atp ctxt name of
    true => is_unit_equality
  | false => K true)
9e620869a576
improved Waldmeister support -- even run it by default on unit equational goals
blanchet
parents:
42943
diff
changeset
|
228 |
|
41242
8edeb1dbbc76
run the SMT relevance filter only once, then run the normalization/monomorphization code once _per class_ of SMT solvers
blanchet
parents:
41241
diff
changeset
|
229 |
fun is_built_in_const_for_prover ctxt name = |
8edeb1dbbc76
run the SMT relevance filter only once, then run the normalization/monomorphization code once _per class_ of SMT solvers
blanchet
parents:
41241
diff
changeset
|
230 |
if is_smt_prover ctxt name then |
41336
0ea5b9c7d233
proper handling of the arguments of SMT builtins -- for numerals, ignore the arguments (Pls, Bit0, Bit1, ..), for functions, consider them;
blanchet
parents:
41335
diff
changeset
|
231 |
let val ctxt = ctxt |> select_smt_solver name in |
0ea5b9c7d233
proper handling of the arguments of SMT builtins -- for numerals, ignore the arguments (Pls, Bit0, Bit1, ..), for functions, consider them;
blanchet
parents:
41335
diff
changeset
|
232 |
fn x => fn ts => |
0ea5b9c7d233
proper handling of the arguments of SMT builtins -- for numerals, ignore the arguments (Pls, Bit0, Bit1, ..), for functions, consider them;
blanchet
parents:
41335
diff
changeset
|
233 |
if SMT_Builtin.is_builtin_num_ext ctxt (list_comb (Const x, ts)) then |
0ea5b9c7d233
proper handling of the arguments of SMT builtins -- for numerals, ignore the arguments (Pls, Bit0, Bit1, ..), for functions, consider them;
blanchet
parents:
41335
diff
changeset
|
234 |
(true, []) |
0ea5b9c7d233
proper handling of the arguments of SMT builtins -- for numerals, ignore the arguments (Pls, Bit0, Bit1, ..), for functions, consider them;
blanchet
parents:
41335
diff
changeset
|
235 |
else if SMT_Builtin.is_builtin_fun_ext ctxt x ts then |
0ea5b9c7d233
proper handling of the arguments of SMT builtins -- for numerals, ignore the arguments (Pls, Bit0, Bit1, ..), for functions, consider them;
blanchet
parents:
41335
diff
changeset
|
236 |
(true, ts) |
0ea5b9c7d233
proper handling of the arguments of SMT builtins -- for numerals, ignore the arguments (Pls, Bit0, Bit1, ..), for functions, consider them;
blanchet
parents:
41335
diff
changeset
|
237 |
else |
0ea5b9c7d233
proper handling of the arguments of SMT builtins -- for numerals, ignore the arguments (Pls, Bit0, Bit1, ..), for functions, consider them;
blanchet
parents:
41335
diff
changeset
|
238 |
(false, ts) |
0ea5b9c7d233
proper handling of the arguments of SMT builtins -- for numerals, ignore the arguments (Pls, Bit0, Bit1, ..), for functions, consider them;
blanchet
parents:
41335
diff
changeset
|
239 |
end |
41242
8edeb1dbbc76
run the SMT relevance filter only once, then run the normalization/monomorphization code once _per class_ of SMT solvers
blanchet
parents:
41241
diff
changeset
|
240 |
else |
41336
0ea5b9c7d233
proper handling of the arguments of SMT builtins -- for numerals, ignore the arguments (Pls, Bit0, Bit1, ..), for functions, consider them;
blanchet
parents:
41335
diff
changeset
|
241 |
fn (s, _) => fn ts => (member (op =) atp_irrelevant_consts s, ts) |
40071
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
242 |
|
40070
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
243 |
(* FUDGE *) |
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
244 |
val atp_relevance_fudge = |
42738 | 245 |
{local_const_multiplier = 1.5, |
41159
1e12d6495423
honor "overlord" option for SMT solvers as well and don't pass "ext" to them
blanchet
parents:
41152
diff
changeset
|
246 |
worse_irrel_freq = 100.0, |
40070
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
247 |
higher_order_irrel_weight = 1.05, |
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
248 |
abs_rel_weight = 0.5, |
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
249 |
abs_irrel_weight = 2.0, |
47934
08d7aff8c7e6
lower skolem penalty to ensure that some useful facts with existentials, e.g. congruence of "setsum", eventually get picked up
blanchet
parents:
47912
diff
changeset
|
250 |
skolem_irrel_weight = 0.05, |
40070
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
251 |
theory_const_rel_weight = 0.5, |
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
252 |
theory_const_irrel_weight = 0.25, |
42735
1d375de437e9
fine-tuned the relevance filter, so that equations of the form "c = (%x. _)" and constants occurring in chained facts are not unduely penalized
blanchet
parents:
42730
diff
changeset
|
253 |
chained_const_irrel_weight = 0.25, |
40070
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
254 |
intro_bonus = 0.15, |
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
255 |
elim_bonus = 0.15, |
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
256 |
simp_bonus = 0.15, |
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
257 |
local_bonus = 0.55, |
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
258 |
assum_bonus = 1.05, |
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
259 |
chained_bonus = 1.5, |
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
260 |
max_imperfect = 11.5, |
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
261 |
max_imperfect_exp = 1.0, |
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
262 |
threshold_divisor = 2.0, |
41093 | 263 |
ridiculous_threshold = 0.01} |
40070
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
264 |
|
40071
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
265 |
(* FUDGE (FIXME) *) |
40070
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
266 |
val smt_relevance_fudge = |
42738 | 267 |
{local_const_multiplier = #local_const_multiplier atp_relevance_fudge, |
41159
1e12d6495423
honor "overlord" option for SMT solvers as well and don't pass "ext" to them
blanchet
parents:
41152
diff
changeset
|
268 |
worse_irrel_freq = #worse_irrel_freq atp_relevance_fudge, |
40071
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
269 |
higher_order_irrel_weight = #higher_order_irrel_weight atp_relevance_fudge, |
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
270 |
abs_rel_weight = #abs_rel_weight atp_relevance_fudge, |
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
271 |
abs_irrel_weight = #abs_irrel_weight atp_relevance_fudge, |
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
272 |
skolem_irrel_weight = #skolem_irrel_weight atp_relevance_fudge, |
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
273 |
theory_const_rel_weight = #theory_const_rel_weight atp_relevance_fudge, |
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
274 |
theory_const_irrel_weight = #theory_const_irrel_weight atp_relevance_fudge, |
42735
1d375de437e9
fine-tuned the relevance filter, so that equations of the form "c = (%x. _)" and constants occurring in chained facts are not unduely penalized
blanchet
parents:
42730
diff
changeset
|
275 |
chained_const_irrel_weight = #chained_const_irrel_weight atp_relevance_fudge, |
40071
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
276 |
intro_bonus = #intro_bonus atp_relevance_fudge, |
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
277 |
elim_bonus = #elim_bonus atp_relevance_fudge, |
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
278 |
simp_bonus = #simp_bonus atp_relevance_fudge, |
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
279 |
local_bonus = #local_bonus atp_relevance_fudge, |
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
280 |
assum_bonus = #assum_bonus atp_relevance_fudge, |
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
281 |
chained_bonus = #chained_bonus atp_relevance_fudge, |
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
282 |
max_imperfect = #max_imperfect atp_relevance_fudge, |
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
283 |
max_imperfect_exp = #max_imperfect_exp atp_relevance_fudge, |
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
284 |
threshold_divisor = #threshold_divisor atp_relevance_fudge, |
658a37c80b53
generalized the relevance filter so that it takes the list of "irrelevant constants" as argument (since the ATP and SMT preprocessing are different)
blanchet
parents:
40070
diff
changeset
|
285 |
ridiculous_threshold = #ridiculous_threshold atp_relevance_fudge} |
40070
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
286 |
|
40941
a3e6f8634a11
replace "smt" prover with specific SMT solvers, e.g. "z3" -- whatever the SMT module gives us
blanchet
parents:
40723
diff
changeset
|
287 |
(* Selects the relevance fudge record for the prover "name":
   "smt_relevance_fudge" if "is_smt_prover ctxt name" holds, otherwise
   "atp_relevance_fudge". NOTE: "smt_relevance_fudge" is currently defined by
   copying every field from "atp_relevance_fudge", so both branches yield the
   same values until the SMT record is tuned separately. *)
fun relevance_fudge_for_prover ctxt name = |
a3e6f8634a11
replace "smt" prover with specific SMT solvers, e.g. "z3" -- whatever the SMT module gives us
blanchet
parents:
40723
diff
changeset
|
288 |
if is_smt_prover ctxt name then smt_relevance_fudge else atp_relevance_fudge |
40070
bdb890782d4a
replaced references with proper record that's threaded through
blanchet
parents:
40069
diff
changeset
|
289 |
|
41727
ab3f6d76fb23
available_provers ~> supported_provers (for clarity)
blanchet
parents:
41723
diff
changeset
|
290 |
fun supported_provers ctxt = |
40060
5ef6747aa619
first step in adding support for an SMT backend to Sledgehammer
blanchet
parents:
40059
diff
changeset
|
291 |
let |
42361 | 292 |
val thy = Proof_Context.theory_of ctxt |
40060
5ef6747aa619
first step in adding support for an SMT backend to Sledgehammer
blanchet
parents:
40059
diff
changeset
|
293 |
val (remote_provers, local_provers) = |
45520 | 294 |
reconstructor_names @ |
41727
ab3f6d76fb23
available_provers ~> supported_provers (for clarity)
blanchet
parents:
41723
diff
changeset
|
295 |
sort_strings (supported_atps thy) @ |
ab3f6d76fb23
available_provers ~> supported_provers (for clarity)
blanchet
parents:
41723
diff
changeset
|
296 |
sort_strings (SMT_Solver.available_solvers_of ctxt) |
40060
5ef6747aa619
first step in adding support for an SMT backend to Sledgehammer
blanchet
parents:
40059
diff
changeset
|
297 |
|> List.partition (String.isPrefix remote_prefix) |
5ef6747aa619
first step in adding support for an SMT backend to Sledgehammer
blanchet
parents:
40059
diff
changeset
|
298 |
in |
41727
ab3f6d76fb23
available_provers ~> supported_provers (for clarity)
blanchet
parents:
41723
diff
changeset
|
299 |
Output.urgent_message ("Supported provers: " ^ |
40205
277508b07418
if "debug" is on, print list of relevant facts (poweruser request);
blanchet
parents:
40204
diff
changeset
|
300 |
commas (local_provers @ remote_provers) ^ ".") |
40060
5ef6747aa619
first step in adding support for an SMT backend to Sledgehammer
blanchet
parents:
40059
diff
changeset
|
301 |
end |
35969 | 302 |
|
48319
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48314
diff
changeset
|
303 |
(* Delegates to "Async_Manager.kill_threads" for the tool name "SledgehammerN"
   and the thread kind "prover" (presumably terminating all running prover
   threads -- confirm against Async_Manager). *)
fun kill_provers () = Async_Manager.kill_threads SledgehammerN "prover" |
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48314
diff
changeset
|
304 |
(* Delegates to "Async_Manager.running_threads" for the tool name
   "SledgehammerN" and the thread kind "prover" (presumably reporting the
   prover threads that are still running -- confirm against Async_Manager). *)
fun running_provers () = Async_Manager.running_threads SledgehammerN "prover" |
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48314
diff
changeset
|
305 |
(* Partial application of "Async_Manager.thread_messages" to the tool name
   "SledgehammerN" and the thread kind "prover"; any remaining arguments are
   supplied by the caller. *)
val messages = Async_Manager.thread_messages SledgehammerN "prover" |
40059
6ad9081665db
use consistent terminology in Sledgehammer: "prover = ATP or SMT solver or ..."
blanchet
parents:
39494
diff
changeset
|
306 |
|
48288
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
307 |
|
40059
6ad9081665db
use consistent terminology in Sledgehammer: "prover = ATP or SMT solver or ..."
blanchet
parents:
39494
diff
changeset
|
308 |
(** problems, results, ATPs, etc. **) |
35969 | 309 |
|
310 |
type params = |
|
48321 | 311 |
{debug : bool, |
312 |
verbose : bool, |
|
313 |
overlord : bool, |
|
314 |
blocking : bool, |
|
315 |
provers : string list, |
|
316 |
type_enc : string option, |
|
317 |
strict : bool, |
|
318 |
lam_trans : string option, |
|
319 |
uncurried_aliases : bool option, |
|
320 |
learn : bool, |
|
321 |
fact_filter : string option, |
|
322 |
max_facts : int option, |
|
323 |
fact_thresholds : real * real, |
|
324 |
max_mono_iters : int option, |
|
325 |
max_new_mono_instances : int option, |
|
49918
cf441f4a358b
renamed Isar-proof related options + changed semantics of Isar shrinking
blanchet
parents:
49914
diff
changeset
|
326 |
isar_proofs : bool, |
51130
76d68444cd59
renamed sledgehammer_shrink to sledgehammer_compress
smolkas
parents:
51024
diff
changeset
|
327 |
isar_compress : real, |
48321 | 328 |
slice : bool, |
329 |
minimize : bool option, |
|
50557 | 330 |
timeout : Time.time option, |
331 |
preplay_timeout : Time.time option, |
|
48321 | 332 |
expect : string} |
35867 | 333 |
|
48288
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
334 |
type relevance_fudge = |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
335 |
{local_const_multiplier : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
336 |
worse_irrel_freq : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
337 |
higher_order_irrel_weight : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
338 |
abs_rel_weight : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
339 |
abs_irrel_weight : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
340 |
skolem_irrel_weight : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
341 |
theory_const_rel_weight : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
342 |
theory_const_irrel_weight : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
343 |
chained_const_irrel_weight : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
344 |
intro_bonus : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
345 |
elim_bonus : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
346 |
simp_bonus : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
347 |
local_bonus : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
348 |
assum_bonus : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
349 |
chained_bonus : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
350 |
max_imperfect : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
351 |
max_imperfect_exp : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
352 |
threshold_divisor : real, |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
353 |
ridiculous_threshold : real} |
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48250
diff
changeset
|
354 |
|
40061
71cc5aac8b76
generalization of the Sledgehammer minimizer, to make it possible to handle SMT solvers as well
blanchet
parents:
40060
diff
changeset
|
355 |
type prover_problem = |
48321 | 356 |
{state : Proof.state, |
357 |
goal : thm, |
|
358 |
subgoal : int, |
|
359 |
subgoal_count : int, |
|
51010 | 360 |
factss : (string * fact list) list} |
35867 | 361 |
|
40061
71cc5aac8b76
generalization of the Sledgehammer minimizer, to make it possible to handle SMT solvers as well
blanchet
parents:
40060
diff
changeset
|
362 |
type prover_result = |
48321 | 363 |
{outcome : failure option, |
364 |
used_facts : (string * stature) list, |
|
51009
e8ff34a1fa9a
thread through fact triple component from which used facts come, for accurate index output
blanchet
parents:
51007
diff
changeset
|
365 |
used_from : fact list, |
48321 | 366 |
run_time : Time.time, |
50669
84c7cf36b2e0
use "Lazy" to simplify control flow a bit and guarantee single evaluation (at most)
blanchet
parents:
50667
diff
changeset
|
367 |
preplay : play Lazy.lazy, |
48321 | 368 |
message : play -> string, |
369 |
message_tail : string} |
|
35867 | 370 |
|
43051 | 371 |
type prover = |
45520 | 372 |
params -> ((string * string list) list -> string -> minimize_command) |
373 |
-> prover_problem -> prover_result |
|
35867 | 374 |
|
38023 | 375 |
(* configuration attributes *) |
376 |
||
43092
93ec303e1917
more work on new metis that exploits the powerful new type encodings
blanchet
parents:
43085
diff
changeset
|
377 |
(* Empty string means create files in Isabelle's temporary files directory. *) |
42616
92715b528e78
added Attrib.setup_config_XXX conveniences, with implicit setup of the background theory;
wenzelm
parents:
42593
diff
changeset
|
378 |
val dest_dir = |
92715b528e78
added Attrib.setup_config_XXX conveniences, with implicit setup of the background theory;
wenzelm
parents:
42593
diff
changeset
|
379 |
Attrib.setup_config_string @{binding sledgehammer_dest_dir} (K "") |
92715b528e78
added Attrib.setup_config_XXX conveniences, with implicit setup of the background theory;
wenzelm
parents:
42593
diff
changeset
|
380 |
val problem_prefix = |
92715b528e78
added Attrib.setup_config_XXX conveniences, with implicit setup of the background theory;
wenzelm
parents:
42593
diff
changeset
|
381 |
Attrib.setup_config_string @{binding sledgehammer_problem_prefix} (K "prob") |
48143 | 382 |
val completish = |
383 |
Attrib.setup_config_bool @{binding sledgehammer_completish} (K false) |
|
28484 | 384 |
|
43092
93ec303e1917
more work on new metis that exploits the powerful new type encodings
blanchet
parents:
43085
diff
changeset
|
385 |
(* In addition to being easier to read, readable names are often much shorter, |
44394
20bd9f90accc
added option to control soundness of encodings more precisely, for evaluation purposes
blanchet
parents:
44393
diff
changeset
|
386 |
especially if types are mangled in names. This makes a difference for some |
20bd9f90accc
added option to control soundness of encodings more precisely, for evaluation purposes
blanchet
parents:
44393
diff
changeset
|
387 |
provers (e.g., E). For this reason, short names are enabled by default. *) |
44592
54906b0337ab
flip logic of boolean option so it's off by default
blanchet
parents:
44586
diff
changeset
|
388 |
val atp_full_names = |
54906b0337ab
flip logic of boolean option so it's off by default
blanchet
parents:
44586
diff
changeset
|
389 |
Attrib.setup_config_bool @{binding sledgehammer_atp_full_names} (K false) |
43092
93ec303e1917
more work on new metis that exploits the powerful new type encodings
blanchet
parents:
43085
diff
changeset
|
390 |
|
42646
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
391 |
val smt_triggers = |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
392 |
Attrib.setup_config_bool @{binding sledgehammer_smt_triggers} (K true) |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
393 |
val smt_weights = |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
394 |
Attrib.setup_config_bool @{binding sledgehammer_smt_weights} (K true) |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
395 |
val smt_weight_min_facts = |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
396 |
Attrib.setup_config_int @{binding sledgehammer_smt_weight_min_facts} (K 20) |
41256
0e7d45cc005f
put the SMT weights back where they belong, so that they're also used by Mirabelle
blanchet
parents:
41242
diff
changeset
|
397 |
|
0e7d45cc005f
put the SMT weights back where they belong, so that they're also used by Mirabelle
blanchet
parents:
41242
diff
changeset
|
398 |
(* FUDGE *) |
42646
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
399 |
val smt_min_weight = |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
400 |
Attrib.setup_config_int @{binding sledgehammer_smt_min_weight} (K 0) |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
401 |
val smt_max_weight = |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
402 |
Attrib.setup_config_int @{binding sledgehammer_smt_max_weight} (K 10) |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
403 |
val smt_max_weight_index = |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
404 |
Attrib.setup_config_int @{binding sledgehammer_smt_max_weight_index} (K 200) |
41256
0e7d45cc005f
put the SMT weights back where they belong, so that they're also used by Mirabelle
blanchet
parents:
41242
diff
changeset
|
405 |
(* Mutable (unsynchronized) reference holding the integer curve function that
   "smt_fact_weight" dereferences when computing fact weights. The default
   curve squares its argument. *)
val smt_weight_curve = Unsynchronized.ref (fn x : int => x * x) |
0e7d45cc005f
put the SMT weights back where they belong, so that they're also used by Mirabelle
blanchet
parents:
41242
diff
changeset
|
406 |
|
42646
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
407 |
fun smt_fact_weight ctxt j num_facts = |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
408 |
if Config.get ctxt smt_weights andalso |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
409 |
num_facts >= Config.get ctxt smt_weight_min_facts then |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
410 |
let |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
411 |
val min = Config.get ctxt smt_min_weight |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
412 |
val max = Config.get ctxt smt_max_weight |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
413 |
val max_index = Config.get ctxt smt_max_weight_index |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
414 |
val curve = !smt_weight_curve |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
415 |
in |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
416 |
SOME (max - (max - min + 1) * curve (Int.max (0, max_index - j - 1)) |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
417 |
div curve max_index) |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
418 |
end |
41256
0e7d45cc005f
put the SMT weights back where they belong, so that they're also used by Mirabelle
blanchet
parents:
41242
diff
changeset
|
419 |
else |
0e7d45cc005f
put the SMT weights back where they belong, so that they're also used by Mirabelle
blanchet
parents:
41242
diff
changeset
|
420 |
NONE |
0e7d45cc005f
put the SMT weights back where they belong, so that they're also used by Mirabelle
blanchet
parents:
41242
diff
changeset
|
421 |
|
42646
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
422 |
fun weight_smt_fact ctxt num_facts ((info, th), j) = |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
423 |
let val thy = Proof_Context.theory_of ctxt in |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
424 |
(info, (smt_fact_weight ctxt j num_facts, th |> Thm.transfer thy)) |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
425 |
end |
38023 | 426 |
|
41313
a96ac4d180b7
optionally supply constant weights to E -- turned off by default until properly parameterized
blanchet
parents:
41259
diff
changeset
|
427 |
(* Returns a pair consisting of the value of the "ISABELLE_HOME_USER"
   environment variable and the string "prob_" followed by the prover name.
   Presumably this is the (directory, problem file prefix) used when the
   "overlord" option is set -- confirm at the call sites. *)
fun overlord_file_location_for_prover prover = |
a96ac4d180b7
optionally supply constant weights to E -- turned off by default until properly parameterized
blanchet
parents:
41259
diff
changeset
|
428 |
(getenv "ISABELLE_HOME_USER", "prob_" ^ prover) |
a96ac4d180b7
optionally supply constant weights to E -- turned off by default until properly parameterized
blanchet
parents:
41259
diff
changeset
|
429 |
|
43052
8d6a4978cc65
automatically minimize with Metis when this can be done within a few seconds
blanchet
parents:
43051
diff
changeset
|
430 |
fun proof_banner mode name = |
43033 | 431 |
case mode of |
432 |
Auto_Try => "Auto Sledgehammer (" ^ quote name ^ ") found a proof" |
|
433 |
| Try => "Sledgehammer (" ^ quote name ^ ") found a proof" |
|
43052
8d6a4978cc65
automatically minimize with Metis when this can be done within a few seconds
blanchet
parents:
43051
diff
changeset
|
434 |
| _ => "Try this" |
43033 | 435 |
|
45561
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
436 |
fun bunch_of_reconstructors needs_full_types lam_trans = |
48800 | 437 |
if needs_full_types then |
48802 | 438 |
[Metis (full_type_enc, lam_trans false), |
439 |
Metis (really_full_type_enc, lam_trans false), |
|
440 |
Metis (full_type_enc, lam_trans true), |
|
441 |
Metis (really_full_type_enc, lam_trans true), |
|
442 |
SMT] |
|
443 |
else |
|
48800 | 444 |
[Metis (partial_type_enc, lam_trans false), |
445 |
Metis (full_type_enc, lam_trans false), |
|
446 |
Metis (no_typesN, lam_trans true), |
|
447 |
Metis (really_full_type_enc, lam_trans true), |
|
448 |
SMT] |
|
45561
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
449 |
|
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
450 |
fun extract_reconstructor ({type_enc, lam_trans, ...} : params) |
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
451 |
(Metis (type_enc', lam_trans')) = |
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
452 |
let |
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
453 |
val override_params = |
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
454 |
(if is_none type_enc andalso type_enc' = hd partial_type_encs then |
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
455 |
[] |
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
456 |
else |
45566
da05ce2de5a8
better threading of type encodings between Sledgehammer and "metis"
blanchet
parents:
45561
diff
changeset
|
457 |
[("type_enc", [hd (unalias_type_enc type_enc')])]) @ |
45561
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
458 |
(if is_none lam_trans andalso lam_trans' = metis_default_lam_trans then |
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
459 |
[] |
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
460 |
else |
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
461 |
[("lam_trans", [lam_trans'])]) |
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
462 |
in (metisN, override_params) end |
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
463 |
| extract_reconstructor _ SMT = (smtN, []) |
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
464 |
|
43033 | 465 |
(* based on "Mirabelle.can_apply" and generalized *) |
43034
18259246abb5
try both "metis" and (on failure) "metisFT" in replay
blanchet
parents:
43033
diff
changeset
|
466 |
(* Runs the tactic "tac" on subgoal "i" of the proof state "state" under the
   time limit "timeout". The context, facts and goal are taken from
   "Proof.goal state"; the facts are first inserted into subgoal "i" with
   "Method.insert_tac", then "tac ctxt i" is applied. Only the first element of
   the resulting sequence is pulled, and the pull is wrapped in "try"
   (presumably so that a failing tactic yields NONE instead of raising --
   confirm against the library definition of "try"). *)
fun timed_apply timeout tac state i = |
43033 | 467 |
let |
468 |
val {context = ctxt, facts, goal} = Proof.goal state |
|
469 |
val full_tac = Method.insert_tac facts i THEN tac ctxt i |
|
50557 | 470 |
in time_limit timeout (try (Seq.pull o full_tac)) goal end |
43033 | 471 |
|
45519
cd6e78cb6ee8
make metis reconstruction handling more flexible
blanchet
parents:
45514
diff
changeset
|
472 |
(* Maps a reconstructor to the tactic that implements it: "metis_tac" with the
   reconstructor's type encoding and lambda translation for Metis, and
   "SMT_Solver.smt_tac" for SMT. *)
fun tac_for_reconstructor reconstr =
  case reconstr of
    Metis (type_enc, lam_trans) => metis_tac [type_enc] lam_trans
  | SMT => SMT_Solver.smt_tac
43034
18259246abb5
try both "metis" and (on failure) "metisFT" in replay
blanchet
parents:
43033
diff
changeset
|
475 |
|
45520 | 476 |
(* Runs the tactic for "reconstr" on the theorems "ths" through "timed_apply".
   Before the tactic is invoked, the verbosity options of both Metis and SMT
   are set to "debug" in the context handed to it. *)
fun timed_reconstructor reconstr debug timeout ths =
  let
    fun tac ctxt =
      let
        val ctxt' =
          ctxt |> Config.put Metis_Tactic.verbose debug
               |> Config.put SMT_Config.verbose debug
      in tac_for_reconstructor reconstr ctxt' ths end
  in timed_apply timeout tac end
43033 | 481 |
|
48798 | 482 |
(* Tests whether the first component of the pair nested inside the fact's
   first component equals "Chained" (presumably the scope part of the fact's
   stature -- confirm against the "stature" type). *)
fun is_fact_chained ((_, (sc, _)), _) = sc = Chained
483 |
||
484 |
(* Returns a list filter that keeps the facts whose first component occurs in
   "used" and, if "keep_chained" is set, also every fact accepted by
   "is_fact_chained". *)
fun filter_used_facts keep_chained used =
  let
    fun is_used fact = member (op =) used (fst fact)
    val keep =
      if keep_chained then is_used orf is_fact_chained else is_used
  in filter keep end
|
43033 | 487 |
|
45781
fc2c368b5f54
use same order of facts for preplay as for actual reconstruction -- Metis sometimes exhibits very different timings depending on the order of the facts
blanchet
parents:
45707
diff
changeset
|
488 |
(* Tries the reconstructors in "reconstrs" in order on subgoal "i" of "state",
   using the theorems from "pairs" sorted by the first component of their
   keys.

   Result:
   - a zero "timeout" skips replaying altogether and yields "Trust_Playable"
     without a time;
   - the first reconstructor that produces a result yields "Played" together
     with the elapsed real time;
   - if none succeeded but at least one timed out, "Trust_Playable" is
     returned for one of the timed-out reconstructors, with "timeout";
   - otherwise "Failed_to_Play" is returned.

   Whenever a reconstructor must be picked without having been played,
   "preferred" is chosen if it is among the candidates, and the last candidate
   otherwise. *)
fun play_one_line_proof mode debug verbose timeout pairs state i preferred
                        reconstrs =
  let
    fun get_preferred candidates =
      if member (op =) candidates preferred then preferred
      else List.last candidates
    fun announce reconstr =
      Output.urgent_message
        ("Trying \"" ^ string_for_reconstructor reconstr ^ "\"" ^
         (case timeout of
            SOME time => " for " ^ string_from_time time
          | NONE => "") ^ "...")
  in
    if timeout = SOME Time.zeroTime then
      Trust_Playable (get_preferred reconstrs, NONE)
    else
      let
        val _ =
          if mode = Minimize then Output.urgent_message "Preplaying proof..."
          else ()
        val ths = map snd (sort_wrt (fst o fst) pairs)
        (* First argument: reconstructors that timed out so far (most recent
           first); second argument: reconstructors still to be tried. *)
        fun play [] [] = Failed_to_Play (get_preferred reconstrs)
          | play timed_outs [] =
            Trust_Playable (get_preferred timed_outs, timeout)
          | play timed_outs (reconstr :: rest) =
            (let
               val _ = if verbose then announce reconstr else ()
               val timer = Timer.startRealTimer ()
             in
               case timed_reconstructor reconstr debug timeout ths state i of
                 SOME (SOME _) => Played (reconstr, Timer.checkRealTimer timer)
               | _ => play timed_outs rest
             end
             handle TimeLimit.TimeOut => play (reconstr :: timed_outs) rest)
      in play [] reconstrs end
  end
526 |
||
41313
a96ac4d180b7
optionally supply constant weights to E -- turned off by default until properly parameterized
blanchet
parents:
41259
diff
changeset
|
527 |
|
41256
0e7d45cc005f
put the SMT weights back where they belong, so that they're also used by Mirabelle
blanchet
parents:
41242
diff
changeset
|
528 |
(* generic TPTP-based ATPs *) |
40061
71cc5aac8b76
generalization of the Sledgehammer minimizer, to make it possible to handle SMT solvers as well
blanchet
parents:
40060
diff
changeset
|
529 |
|
42730
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
530 |
(* "Too general" means a positive equality literal with a variable X as one
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
531 |
operand, when X does not occur properly in the other operand. This rules out |
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
532 |
clearly inconsistent facts such as X = a | X = b, though it by no means |
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
533 |
guarantees soundness. *) |
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
534 |
|
51013 | 535 |
(* Selects the facts associated with "fact_filter" in the association list
   "factss". A singleton list yields its only entry regardless of the filter;
   otherwise the entry for "fact_filter" is returned, falling back to the
   first entry if the filter has none. *)
fun get_facts_for_filter fact_filter factss =
  case factss of
    [(_, only_facts)] => only_facts
  | _ =>
    (case AList.lookup (op =) factss fact_filter of
       NONE => snd (hd factss)
     | SOME facts => facts)
|
540 |
||
42730
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
541 |
(* Unwanted equalities are those between a (bound or schematic) variable that |
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
542 |
does not properly occur in the second operand. *) |
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
543 |
(* Recognizes formulas built entirely from "bad" equalities, i.e., equalities
   in which one side is a schematic or bound variable that does not occur in
   the other side. The traversal tracks polarity: it descends through
   "Trueprop", universal quantifiers (positive) and existential quantifiers
   (negative), implications, negation, disjunction (positive), and
   conjunction (negative). Anything else is rejected. *)
val is_exhaustive_finite =
  let
    fun mentions_var z = exists_subterm (fn Var z' => z = z' | _ => false)
    fun is_bad_equal (Var z) u = not (mentions_var z u)
      | is_bad_equal (Bound j) u = not (loose_bvar1 (u, j))
      | is_bad_equal _ _ = false
    fun do_equals lhs rhs = is_bad_equal lhs rhs orelse is_bad_equal rhs lhs
    fun do_formula pos (@{const Trueprop} $ t1) = do_formula pos t1
      | do_formula true (Const (@{const_name all}, _) $ Abs (_, _, body)) =
        do_formula true body
      | do_formula true (Const (@{const_name All}, _) $ Abs (_, _, body)) =
        do_formula true body
      | do_formula false (Const (@{const_name Ex}, _) $ Abs (_, _, body)) =
        do_formula false body
      | do_formula pos (@{const "==>"} $ t1 $ t2) =
        do_formula (not pos) t1 andalso
        (t2 = @{prop False} orelse do_formula pos t2)
      | do_formula pos (@{const HOL.implies} $ t1 $ t2) =
        do_formula (not pos) t1 andalso
        (t2 = @{const False} orelse do_formula pos t2)
      | do_formula pos (@{const Not} $ t1) = do_formula (not pos) t1
      | do_formula true (@{const HOL.disj} $ t1 $ t2) =
        do_formula true t1 andalso do_formula true t2
      | do_formula false (@{const HOL.conj} $ t1 $ t2) =
        do_formula false t1 andalso do_formula false t2
      | do_formula true (Const (@{const_name HOL.eq}, _) $ t1 $ t2) =
        do_equals t1 t2
      | do_formula true (Const (@{const_name "=="}, _) $ t1 $ t2) =
        do_equals t1 t2
      | do_formula _ _ = false
  in do_formula true end
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
572 |
|
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
573 |
(* Checks whether a term has a subterm that is either a schematic variable or
   an abstraction whose (bound-variable) type is a "Type _" satisfying
   "pred". *)
fun has_bound_or_var_of_type pred =
  let
    fun is_hit (Var (_, T as Type _)) = pred T
      | is_hit (Abs (_, T as Type _, _)) = pred T
      | is_hit _ = false
  in exists_subterm is_hit end
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
577 |
|
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
578 |
(* Facts are forbidden to contain variables of these types. The typical reason |
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
579 |
is that they lead to unsoundness. Note that "unit" satisfies numerous |
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
580 |
equations like "?x = ()". The resulting clauses will have no type constraint, |
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
581 |
yielding false proofs. Even "bool" leads to many unsound proofs, though only |
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
582 |
for higher-order problems. *) |
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
583 |
|
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
584 |
(* Facts containing variables of type "unit" or "bool" or of the form |
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
585 |
"ALL x. x = A | x = B | x = C" are likely to lead to unsound proofs if types |
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
586 |
are omitted. *) |
42944
9e620869a576
improved Waldmeister support -- even run it by default on unit equational goals
blanchet
parents:
42943
diff
changeset
|
587 |
(* A proposition is considered dangerous if, after "transform_elim_prop", it
   contains a bound or schematic variable whose type satisfies
   "is_type_surely_finite ctxt", or if it is accepted by
   "is_exhaustive_finite". *)
fun is_dangerous_prop ctxt =
  let
    val has_finite_var = has_bound_or_var_of_type (is_type_surely_finite ctxt)
  in
    fn t =>
      let val t' = transform_elim_prop t in
        has_finite_var t' orelse is_exhaustive_finite t'
      end
  end
d6db5a815477
improve detection of quantifications over dangerous types by leveraging "is_type_surely_finite" predicate and added "prop" to the list of surely finite types
blanchet
parents:
42729
diff
changeset
|
591 |
|
39492 | 592 |
(* Important messages are important but not so important that users want to see |
593 |
them each time. *) |
|
44649 | 594 |
(* NOTE(review): presumably an important message is shown about once in every
   25 opportunities; the exact rule is at the use site -- confirm there. *)
val atp_important_message_keep_quotient = 25
39492 | 595 |
|
44416
cabd06b69c18
added formats to the slice and use TFF for remote Vampire
blanchet
parents:
44397
diff
changeset
|
596 |
(* Returns a function from an optional type encoding name to a type encoding:
   the name defaults to "best_type_enc", is parsed with
   "type_enc_from_string soundness", and is then adapted to "format" with
   "adjust_type_enc". *)
fun choose_type_enc soundness best_type_enc format =
  let
    val parse = type_enc_from_string soundness
    val adjust = adjust_type_enc format
  in
    fn type_enc_opt => adjust (parse (the_default best_type_enc type_enc_opt))
  end
42548
ea2a28b1938f
make sure the minimizer monomorphizes when it should
blanchet
parents:
42544
diff
changeset
|
600 |
|
43051 | 601 |
(* Longest preplay time for which "choose_minimize_command" still switches the
   minimization command over to the reconstructor that was played. *)
val metis_minimize_max_time = seconds 2.0
602 |
||
45561
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
603 |
(* Builds the minimization command. If the proof was replayed within
   "metis_minimize_max_time", the command uses the name and parameter
   overrides that "extract_reconstructor" derives from the played
   reconstructor; in every other case it keeps "name" with no overrides. *)
fun choose_minimize_command params minimize_command name preplay =
  let
    val default = (name, [])
    val (name', override_params) =
      case preplay of
        Played (reconstr, time) =>
        if Time.> (time, metis_minimize_max_time) then default
        else extract_reconstructor params reconstr
      | _ => default
  in minimize_command override_params name' end
|
43051 | 614 |
|
47962
137883567114
lower the monomorphization thresholds for less scalable provers
blanchet
parents:
47946
diff
changeset
|
615 |
(* Configures the monomorphizer in a context: "max_rounds" and
   "max_new_instances" take the optional user values, falling back to the
   corresponding "best_" defaults, and "keep_partial_instances" is switched
   off. *)
fun repair_monomorph_context max_iters best_max_iters max_new_instances
                             best_max_new_instances =
  let
    val rounds = the_default best_max_iters max_iters
    val new_instances = the_default best_max_new_instances max_new_instances
  in
    Config.put Monomorph.max_rounds rounds
    #> Config.put Monomorph.max_new_instances new_instances
    #> Config.put Monomorph.keep_partial_instances false
  end
43226 | 621 |
|
50494 | 622 |
(* File name component identifying the mode: "_try" for the two try modes,
   "_min" for the two minimization modes, and nothing for the others. *)
fun suffix_for_mode mode =
  case mode of
    Auto_Try => "_try"
  | Try => "_try"
  | Normal => ""
  | MaSh => ""
  | Auto_Minimize => "_min"
  | Minimize => "_min"
369e8c28a61a
added a component in generated file names reflecting whether the minimizer is used -- needed for evaluation to keep these files separated from the main problem files
blanchet
parents:
44423
diff
changeset
|
628 |
|
44423
f74707e12d30
exploit TFF format in Z3 used as ATP, and renamed it "z3_tptp"
blanchet
parents:
44416
diff
changeset
|
629 |
(* Give the ATPs some slack before interrupting them the hard way. "z3_tptp" on |
43631
4144d7b4ec77
enforce hard timeout on ATPs (esp. "z3_atp" on Linux) + remove obsolete failure codes
blanchet
parents:
43626
diff
changeset
|
630 |
Linux appears to be the only ATP that does not honor its time limit. *) |
43690 | 631 |
(* NOTE(review): presumably added to an ATP's own time limit to obtain the
   hard limit after which it is interrupted -- confirm at the use site. *)
val atp_timeout_slack = seconds 1.0
43631
4144d7b4ec77
enforce hard timeout on ATPs (esp. "z3_atp" on Linux) + remove obsolete failure codes
blanchet
parents:
43626
diff
changeset
|
632 |
|
48331
f190a6dbb29b
make the monomorphizer more predictable by making the cutoff independent on the number of facts
blanchet
parents:
48321
diff
changeset
|
633 |
(* NOTE(review): judging by the name, an upper bound on the number of facts
   given privileged treatment during monomorphization -- confirm at the use
   site. *)
val mono_max_privileged_facts = 10
f190a6dbb29b
make the monomorphizer more predictable by making the cutoff independent on the number of facts
blanchet
parents:
48321
diff
changeset
|
634 |
|
51186
c8721406511a
interpret "max_facts" argument in a slice-dependent fashion, instead of forcing the same number of facts to all slices
blanchet
parents:
51181
diff
changeset
|
635 |
(* For low values of "max_facts", this fudge value ensures that most slices are |
c8721406511a
interpret "max_facts" argument in a slice-dependent fashion, instead of forcing the same number of facts to all slices
blanchet
parents:
51181
diff
changeset
|
636 |
invoked with a nontrivial number of facts. *)
c8721406511a
interpret "max_facts" argument in a slice-dependent fashion, instead of forcing the same number of facts to all slices
blanchet
parents:
51181
diff
changeset
|
637 |
(* NOTE(review): how this value enters the per-slice fact computation is
   decided at the use site -- confirm there before changing it. *)
val max_fact_factor_fudge = 5
c8721406511a
interpret "max_facts" argument in a slice-dependent fashion, instead of forcing the same number of facts to all slices
blanchet
parents:
51181
diff
changeset
|
638 |
|
43021 | 639 |
fun run_atp mode name |
48376
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
640 |
({exec, arguments, proof_delims, known_failures, prem_role, best_slices, |
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
641 |
best_max_mono_iters, best_max_new_mono_instances, ...} : atp_config) |
46301 | 642 |
(params as {debug, verbose, overlord, type_enc, strict, lam_trans, |
51024
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
643 |
uncurried_aliases, fact_filter, max_facts, max_mono_iters, |
51130
76d68444cd59
renamed sledgehammer_shrink to sledgehammer_compress
smolkas
parents:
51024
diff
changeset
|
644 |
max_new_mono_instances, isar_proofs, isar_compress, |
46409
d4754183ccce
made option available to users (mostly for experiments)
blanchet
parents:
46407
diff
changeset
|
645 |
slice, timeout, preplay_timeout, ...}) |
43037 | 646 |
minimize_command |
51013 | 647 |
({state, goal, subgoal, subgoal_count, factss, ...} : prover_problem) = |
38023 | 648 |
let |
42182
a630978fc967
start monomorphization process with subgoal, not entire goal, to avoid needless instances (and only print monomorphization messages in debug mode)
blanchet
parents:
42181
diff
changeset
|
649 |
val thy = Proof.theory_of state |
39318 | 650 |
val ctxt = Proof.context_of state |
47946
33afcfad3f8d
add an experimental "aggressive" mode to Sledgehammer, to experiment with more complete translations of higher-order features without breaking "metis"
blanchet
parents:
47934
diff
changeset
|
651 |
val atp_mode = |
48143 | 652 |
if Config.get ctxt completish then Sledgehammer_Completish |
47946
33afcfad3f8d
add an experimental "aggressive" mode to Sledgehammer, to experiment with more complete translations of higher-order features without breaking "metis"
blanchet
parents:
47934
diff
changeset
|
653 |
else Sledgehammer |
43004
20e9caff1f86
fix soundness bug in Sledgehammer: distinguish params in goals from fixed variables in context
blanchet
parents:
42998
diff
changeset
|
654 |
val (_, hyp_ts, concl_t) = strip_subgoal ctxt goal subgoal |
41159
1e12d6495423
honor "overlord" option for SMT solvers as well and don't pass "ext" to them
blanchet
parents:
41152
diff
changeset
|
655 |
val (dest_dir, problem_prefix) = |
1e12d6495423
honor "overlord" option for SMT solvers as well and don't pass "ext" to them
blanchet
parents:
41152
diff
changeset
|
656 |
if overlord then overlord_file_location_for_prover name |
1e12d6495423
honor "overlord" option for SMT solvers as well and don't pass "ext" to them
blanchet
parents:
41152
diff
changeset
|
657 |
else (Config.get ctxt dest_dir, Config.get ctxt problem_prefix) |
40061
71cc5aac8b76
generalization of the Sledgehammer minimizer, to make it possible to handle SMT solvers as well
blanchet
parents:
40060
diff
changeset
|
658 |
val problem_file_name = |
41159
1e12d6495423
honor "overlord" option for SMT solvers as well and don't pass "ext" to them
blanchet
parents:
41152
diff
changeset
|
659 |
Path.basic (problem_prefix ^ (if overlord then "" else serial_string ()) ^ |
44509
369e8c28a61a
added a component in generated file names reflecting whether the minimizer is used -- needed for evaluation to keep these files separated from the main problem files
blanchet
parents:
44423
diff
changeset
|
660 |
suffix_for_mode mode ^ "_" ^ string_of_int subgoal) |
48656
5caa414ce9a2
cleaner temporary file cleanup for MaSh, based on tried-and-trusted code
blanchet
parents:
48532
diff
changeset
|
661 |
val prob_path = |
40059
6ad9081665db
use consistent terminology in Sledgehammer: "prover = ATP or SMT solver or ..."
blanchet
parents:
39494
diff
changeset
|
662 |
if dest_dir = "" then |
40061
71cc5aac8b76
generalization of the Sledgehammer minimizer, to make it possible to handle SMT solvers as well
blanchet
parents:
40060
diff
changeset
|
663 |
File.tmp_path problem_file_name |
40059
6ad9081665db
use consistent terminology in Sledgehammer: "prover = ATP or SMT solver or ..."
blanchet
parents:
39494
diff
changeset
|
664 |
else if File.exists (Path.explode dest_dir) then |
40061
71cc5aac8b76
generalization of the Sledgehammer minimizer, to make it possible to handle SMT solvers as well
blanchet
parents:
40060
diff
changeset
|
665 |
Path.append (Path.explode dest_dir) problem_file_name |
39003
c2aebd79981f
run relevance filter in a thread, to avoid blocking
blanchet
parents:
39000
diff
changeset
|
666 |
else |
40059
6ad9081665db
use consistent terminology in Sledgehammer: "prover = ATP or SMT solver or ..."
blanchet
parents:
39494
diff
changeset
|
667 |
error ("No such directory: " ^ quote dest_dir ^ ".") |
48376
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
668 |
val command0 = |
47055
16e2633f3b4b
made "spass" a "metaprover" that uses either the new SPASS or the old SPASS, to preserve backward compatibility and prepare for the upcoming release
blanchet
parents:
47038
diff
changeset
|
669 |
case find_first (fn var => getenv var <> "") (fst exec) of |
48376
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
670 |
SOME var => |
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
671 |
let |
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
672 |
val pref = getenv var ^ "/" |
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
673 |
val paths = map (Path.explode o prefix pref) (snd exec) |
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
674 |
in |
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
675 |
case find_first File.exists paths of |
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
676 |
SOME path => path |
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
677 |
| NONE => error ("Bad executable: " ^ Path.print (hd paths) ^ ".") |
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
678 |
end |
47055
16e2633f3b4b
made "spass" a "metaprover" that uses either the new SPASS or the old SPASS, to preserve backward compatibility and prepare for the upcoming release
blanchet
parents:
47038
diff
changeset
|
679 |
| NONE => error ("The environment variable " ^ quote (hd (fst exec)) ^ |
16e2633f3b4b
made "spass" a "metaprover" that uses either the new SPASS or the old SPASS, to preserve backward compatibility and prepare for the upcoming release
blanchet
parents:
47038
diff
changeset
|
680 |
" is not set.") |
38023 | 681 |
(* Separates the text produced by the timed shell command into the prover's
   own output and the elapsed time.

   The last nonempty line of "s" is taken to be the timing line, of the form
   "<seconds>.<three digits>" (the shape requested elsewhere in this file via
   TIMEFORMAT='%3R'); it is turned into a number of milliseconds. All
   preceding lines are joined back together and returned as the output. If
   "s" has no lines at all, or the timing line cannot be parsed, the time is
   zero. *)
fun split_time s =
  let
    (* "String.tokens" never yields empty tokens, so blank lines vanish. *)
    val lines = String.tokens (fn c => str c = "\n") s
    val (output, t) =
      (case try split_last lines of
         SOME (front, last) => (front, last)
       | NONE => ([], "0"))
      |>> cat_lines
    (* Scanners for "<digits>.<ddd>", yielding milliseconds. *)
    fun as_num f = f >> (fst o read_int)
    val digit = Scan.one Symbol.is_ascii_digit
    val num = as_num (Scan.many1 Symbol.is_ascii_digit)
    val num3 = as_num (digit ::: digit ::: (digit >> single))
    val time = num --| Scan.$$ "." -- num3 >> (fn (a, b) => a * 1000 + b)
    fun millis_of str =
      the_default 0 (Scan.read Symbol.stopper time (raw_explode str))
  in
    (output, Time.fromMilliseconds (millis_of t))
  end
48656
5caa414ce9a2
cleaner temporary file cleanup for MaSh, based on tried-and-trusted code
blanchet
parents:
48532
diff
changeset
|
695 |
fun run () = |
48376
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
696 |
let |
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
697 |
(* If slicing is disabled, we expand the last slice to fill the entire |
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
698 |
time available. *) |
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
699 |
val actual_slices = get_slices slice (best_slices ctxt) |
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
700 |
val num_actual_slices = length actual_slices |
51186
c8721406511a
interpret "max_facts" argument in a slice-dependent fashion, instead of forcing the same number of facts to all slices
blanchet
parents:
51181
diff
changeset
|
701 |
val max_fact_factor = |
c8721406511a
interpret "max_facts" argument in a slice-dependent fashion, instead of forcing the same number of facts to all slices
blanchet
parents:
51181
diff
changeset
|
702 |
case max_facts of |
c8721406511a
interpret "max_facts" argument in a slice-dependent fashion, instead of forcing the same number of facts to all slices
blanchet
parents:
51181
diff
changeset
|
703 |
NONE => 1.0 |
c8721406511a
interpret "max_facts" argument in a slice-dependent fashion, instead of forcing the same number of facts to all slices
blanchet
parents:
51181
diff
changeset
|
704 |
| SOME max => |
c8721406511a
interpret "max_facts" argument in a slice-dependent fashion, instead of forcing the same number of facts to all slices
blanchet
parents:
51181
diff
changeset
|
705 |
Real.fromInt max |
c8721406511a
interpret "max_facts" argument in a slice-dependent fashion, instead of forcing the same number of facts to all slices
blanchet
parents:
51181
diff
changeset
|
706 |
/ Real.fromInt (fold (Integer.max o slice_max_facts) |
c8721406511a
interpret "max_facts" argument in a slice-dependent fashion, instead of forcing the same number of facts to all slices
blanchet
parents:
51181
diff
changeset
|
707 |
actual_slices 0) |
48376
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
708 |
(* Monomorphizes a list of (name, theorem) facts.

   The theorems are handed to "Monomorph.monomorph" together with a
   pseudo-theorem built from the goal's hypotheses and conclusion, so that
   the same constants as in the subgoal are involved. Each theorem carries a
   numeric tag: 0 for the pseudo-theorem, 1 for the first
   "mono_max_privileged_facts" facts, 2 for all remaining ones.

   The result pairs every instance returned for a fact with that fact's
   original name; the entry belonging to the pseudo-theorem is dropped. *)
fun monomorphize_facts facts =
  let
    val mono_ctxt =
      repair_monomorph_context max_mono_iters best_max_mono_iters
        max_new_mono_instances best_max_new_mono_instances ctxt
    (* pseudo-theorem involving the same constants as the subgoal *)
    val subgoal_th =
      Skip_Proof.make_thm thy (Logic.list_implies (hyp_ts, concl_t))
    val (privileged, ordinary) = chop mono_max_privileged_facts facts
    val tagged_ths =
      (0, subgoal_th)
      :: (map (pair 1 o snd) privileged @ map (pair 2 o snd) ordinary)
    val (instancess, _) =
      Monomorph.monomorph atp_schematic_consts_of tagged_ths mono_ctxt
    (* Attach the fact's name to each of its instances. *)
    fun label (name, instances) =
      map (fn (_, th) => (name, zero_var_indexes th)) instances
  in
    (* "tl" discards the instances of the pseudo-theorem at the head. *)
    maps label (ListPair.zip (map fst facts, tl instancess))
  end
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
729 |
(* Runs one slice of the prover's schedule.

   Arguments:
     time_left                 optional time still available overall
     (cache_key, cache_value)  key and problem left behind by the previous
                               slice; reused when the key equals this one's
     (slice, (time_frac, (key, extra)))
                               slice index, its share of the total timeout,
                               its problem-generation settings (also the
                               cache key), and extra prover arguments

   Result: ((SOME key, problem), (output, run_time, facts, atp_proof,
   outcome)), where the first component is the cache for the next slice and
   "facts" is the fact list selected for this slice. *)
fun run_slice time_left (cache_key, cache_value)
        (slice, (time_frac,
            (key as ((best_max_facts, best_fact_filter), format,
                     best_type_enc, best_lam_trans,
                     best_uncurried_aliases),
             extra))) =
  let
    (* An explicitly given fact filter overrides the slice's own. *)
    val effective_fact_filter = the_default best_fact_filter fact_filter
    val facts = get_facts_for_filter effective_fact_filter factss
    (* Scale the slice's fact count, add the fudge term, and never ask for
       more facts than are available. *)
    val wanted_facts =
      Real.ceil (max_fact_factor * Real.fromInt best_max_facts) +
      max_fact_factor_fudge
    val num_facts = Integer.min (length facts) wanted_facts
    val soundness = if strict then Strict else Non_Strict
    val type_enc = choose_type_enc soundness best_type_enc format type_enc
    val sound = is_type_enc_sound type_enc
    fun real_ms t = Real.fromInt (Time.toMilliseconds t)
    (* Every slice but the last is capped at its fraction of the total
       timeout; the last one may use all the time that is left. *)
    fun slice_budget left =
      let
        val left_ms = real_ms left
        val budget_ms =
          if slice < num_actual_slices - 1 then
            Real.min (time_frac * real_ms (the timeout), left_ms)
          else
            left_ms
      in
        seconds (budget_ms * 0.001)
      end
    val slice_timeout = Option.map slice_budget time_left
    (* The limit enforced from the ML side includes some slack on top of the
       timeout passed to the prover; in MaSh mode no limit is enforced. *)
    val generous_slice_timeout =
      if mode = MaSh then
        NONE
      else
        Option.map (fn t => Time.+ (atp_timeout_slack, t)) slice_timeout
    val _ =
      if debug then
        let
          val duration =
            case slice_timeout of
              SOME t => " for " ^ string_from_time t
            | NONE => ""
        in
          Output.urgent_message
            (quote name ^ " slice #" ^ string_of_int (slice + 1) ^
             " with " ^ string_of_int num_facts ^ " fact" ^
             plural_s num_facts ^ duration ^ "...")
        end
      else
        ()
    val readable_names = not (Config.get ctxt atp_full_names)
    (* Explicit settings win over the slice's preferred ones. *)
    val lam_trans = the_default best_lam_trans lam_trans
    val uncurried_aliases =
      the_default best_uncurried_aliases uncurried_aliases
    (* Builds the ATP problem from scratch for this slice. *)
    fun generate_problem () =
      facts
      |> (if sound then I
          else filter_out (is_dangerous_prop ctxt o prop_of o snd))
      |> take num_facts
      |> (if is_type_enc_polymorphic type_enc then I
          else monomorphize_facts)
      |> map (apsnd prop_of)
      |> prepare_atp_problem ctxt format prem_role type_enc atp_mode
                             lam_trans uncurried_aliases
                             readable_names true hyp_ts concl_t
    val value as (atp_problem, _, fact_names, _, _) =
      if cache_key = SOME key then cache_value else generate_problem ()
    fun sel_weights () = atp_problem_selection_weights atp_problem
    fun ord_info () = atp_problem_term_order_info atp_problem
    val ord = effective_term_order ctxt name
    val full_proof = debug orelse isar_proofs
    val args =
      arguments ctxt full_proof extra (the_default one_day slice_timeout)
                (File.shell_path prob_path) (ord, ord_info, sel_weights)
    (* The prover runs under "time", which prints the elapsed time as the
       last line; stderr is merged into stdout. *)
    val command =
      enclose "TIMEFORMAT='%3R'; { time " " ; }"
        ("(exec 2>&1; " ^ File.shell_path command0 ^ " " ^ args ^ " " ^ ")")
    (* The problem file starts with the command line as a comment. *)
    val _ =
      File.write_list prob_path
        (("% " ^ command ^ "\n")
         :: lines_for_atp_problem format ord ord_info atp_problem)
    (* Invokes the prover and parses what it printed. *)
    fun run_prover () =
      let
        val (raw_output, _) =
          time_limit generous_slice_timeout Isabelle_System.bash_output
                     command
        val stamped_output =
          if overlord then
            "% " ^ command ^ "\n% " ^ timestamp () ^ "\n" ^ raw_output
          else
            raw_output
        val timed as (output, _) = split_time stamped_output
        val proof_and_outcome =
          (extract_tstplike_proof_and_outcome verbose proof_delims
                                              known_failures output
           |>> atp_proof_from_tstplike_proof atp_problem)
          handle UNRECOGNIZED_ATP_PROOF () => ([], SOME ProofIncomplete)
      in
        (timed, facts, proof_and_outcome)
      end
    (* The middle component is not consulted below: the result tuple is
       built from "facts" directly. *)
    val ((output, run_time), _, (atp_proof, outcome)) =
      run_prover ()
      handle TimeLimit.TimeOut =>
             (("", the slice_timeout), [], ([], SOME TimedOut))
    (* A proof reported without failure is still checked by
       "used_facts_in_unsound_atp_proof"; a positive answer becomes an
       "UnsoundProof" failure, which in debug mode is only printed as a
       warning. *)
    val outcome =
      case outcome of
        NONE =>
        (case Option.map (sort string_ord)
                (used_facts_in_unsound_atp_proof ctxt fact_names
                                                 atp_proof) of
           SOME unsound_facts =>
           let
             val failure =
               UnsoundProof (is_type_enc_sound type_enc, unsound_facts)
           in
             if debug then (warning (string_for_failure failure); NONE)
             else SOME failure
           end
         | NONE => NONE)
      | _ => outcome
  in
    ((SOME key, value), (output, run_time, facts, atp_proof, outcome))
  end
|
48376
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
846 |
val timer = Timer.startRealTimer () |
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
847 |
(* Folding step over the slices. While the accumulated result still carries
   a failure ("SOME _" as outcome), the next slice is attempted, provided
   that there is no overall timeout or that it has not yet elapsed according
   to "timer". The run time of the new slice is added to the time
   accumulated so far. Once a result without failure is present, or the time
   is used up, the accumulated result is passed through unchanged. *)
fun maybe_run_slice slice
        (result as (cache, (_, run_time0, _, _, SOME _))) =
    let
      val time_left =
        case timeout of
          SOME limit => SOME (Time.- (limit, Timer.checkRealTimer timer))
        | NONE => NONE
      val out_of_time =
        case time_left of
          SOME t => Time.<= (t, Time.zeroTime)
        | NONE => false
    in
      if out_of_time then
        result
      else
        let
          val (cache', (output, run_time, used_from, atp_proof, outcome)) =
            run_slice time_left cache slice
        in
          (cache', (output, Time.+ (run_time0, run_time), used_from,
                    atp_proof, outcome))
        end
    end
  | maybe_run_slice _ result = result
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
866 |
in |
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
867 |
((NONE, ([], Symtab.empty, Vector.fromList [], [], Symtab.empty)), |
51013 | 868 |
("", Time.zeroTime, [], [], SOME InternalError)) |
48376
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
869 |
|> fold maybe_run_slice actual_slices |
416e4123baf3
use "eproof_ram" script if available (plug-in replacement for "eproof", but faster)
blanchet
parents:
48331
diff
changeset
|
870 |
end |
38023 | 871 |
(* If the problem file has not been exported, remove it; otherwise, export |
872 |
the proof file too. *) |
|
48656
5caa414ce9a2
cleaner temporary file cleanup for MaSh, based on tried-and-trusted code
blanchet
parents:
48532
diff
changeset
|
873 |
(* Deletes the problem file when no destination directory is configured
   ("dest_dir" is empty). Failures of the removal are ignored. With a
   destination directory, the file is kept. *)
fun clean_up () =
  case dest_dir of
    "" => ignore (try File.rm prob_path)
  | _ => ()
51013 | 875 |
(* When a destination directory is configured ("dest_dir" is nonempty),
   writes the prover output next to the problem file, under the problem
   file's path with "_proof" appended. Otherwise does nothing. *)
fun export (_, (output, _, _, _, _)) =
  if dest_dir <> "" then
    let
      val proof_path = Path.explode (Path.implode prob_path ^ "_proof")
    in
      File.write proof_path output
    end
  else
    ()
46407
30e9720cc0b9
optimization: slice caching in case two consecutive slices are nearly identical
blanchet
parents:
46405
diff
changeset
|
878 |
val ((_, (_, pool, fact_names, _, sym_tab)), |
51013 | 879 |
(output, run_time, used_from, atp_proof, outcome)) = |
48656
5caa414ce9a2
cleaner temporary file cleanup for MaSh, based on tried-and-trusted code
blanchet
parents:
48532
diff
changeset
|
880 |
with_cleanup clean_up run () |> tap export |
39492 | 881 |
val important_message = |
43021 | 882 |
if mode = Normal andalso |
42609 | 883 |
random_range 0 (atp_important_message_keep_quotient - 1) = 0 then |
39492 | 884 |
extract_important_message output |
885 |
else |
|
886 |
"" |
|
43261
a4aeb26a6362
make sure that the message tail (timing + TPTP important message) is preserved upon automatic minimization
blanchet
parents:
43259
diff
changeset
|
887 |
val (used_facts, preplay, message, message_tail) = |
38023 | 888 |
case outcome of |
889 |
NONE => |
|
43033 | 890 |
let |
45551 | 891 |
val used_facts = used_facts_in_atp_proof ctxt fact_names atp_proof |
45590 | 892 |
val needs_full_types = is_typed_helper_used_in_atp_proof atp_proof |
45521 | 893 |
val reconstrs = |
45554
09ad83de849c
don't pass "lam_lifted" option to "metis" unless there's a good reason
blanchet
parents:
45553
diff
changeset
|
894 |
bunch_of_reconstructors needs_full_types |
45560
1606122a2d0f
don't needlessly pass "lam_lifted" option to "metis" call for SMT proof
blanchet
parents:
45557
diff
changeset
|
895 |
(lam_trans_from_atp_proof atp_proof |
46405 | 896 |
o (fn desperate => if desperate then hide_lamsN |
897 |
else metis_default_lam_trans)) |
|
43033 | 898 |
in |
43052
8d6a4978cc65
automatically minimize with Metis when this can be done within a few seconds
blanchet
parents:
43051
diff
changeset
|
899 |
(used_facts, |
50669
84c7cf36b2e0
use "Lazy" to simplify control flow a bit and guarantee single evaluation (at most)
blanchet
parents:
50667
diff
changeset
|
900 |
Lazy.lazy (fn () => |
84c7cf36b2e0
use "Lazy" to simplify control flow a bit and guarantee single evaluation (at most)
blanchet
parents:
50667
diff
changeset
|
901 |
let |
84c7cf36b2e0
use "Lazy" to simplify control flow a bit and guarantee single evaluation (at most)
blanchet
parents:
50667
diff
changeset
|
902 |
val used_pairs = |
51013 | 903 |
used_from |> filter_used_facts false used_facts |
50669
84c7cf36b2e0
use "Lazy" to simplify control flow a bit and guarantee single evaluation (at most)
blanchet
parents:
50667
diff
changeset
|
904 |
in |
84c7cf36b2e0
use "Lazy" to simplify control flow a bit and guarantee single evaluation (at most)
blanchet
parents:
50667
diff
changeset
|
905 |
play_one_line_proof mode debug verbose preplay_timeout |
84c7cf36b2e0
use "Lazy" to simplify control flow a bit and guarantee single evaluation (at most)
blanchet
parents:
50667
diff
changeset
|
906 |
used_pairs state subgoal (hd reconstrs) reconstrs |
84c7cf36b2e0
use "Lazy" to simplify control flow a bit and guarantee single evaluation (at most)
blanchet
parents:
50667
diff
changeset
|
907 |
end), |
43052
8d6a4978cc65
automatically minimize with Metis when this can be done within a few seconds
blanchet
parents:
43051
diff
changeset
|
908 |
fn preplay => |
8d6a4978cc65
automatically minimize with Metis when this can be done within a few seconds
blanchet
parents:
43051
diff
changeset
|
909 |
let |
49921 | 910 |
val _ = |
911 |
if verbose then |
|
912 |
Output.urgent_message "Generating proof text..." |
|
913 |
else |
|
914 |
() |
|
43052
8d6a4978cc65
automatically minimize with Metis when this can be done within a few seconds
blanchet
parents:
43051
diff
changeset
|
915 |
val isar_params = |
51130
76d68444cd59
renamed sledgehammer_shrink to sledgehammer_compress
smolkas
parents:
51024
diff
changeset
|
916 |
(debug, verbose, preplay_timeout, isar_compress, |
50004
c96e8e40d789
several improvements to Isar proof reconstruction, by Steffen Smolka (step merging in case splits, time measurements, etc.)
blanchet
parents:
49921
diff
changeset
|
917 |
pool, fact_names, sym_tab, atp_proof, goal) |
43052
8d6a4978cc65
automatically minimize with Metis when this can be done within a few seconds
blanchet
parents:
43051
diff
changeset
|
918 |
val one_line_params = |
8d6a4978cc65
automatically minimize with Metis when this can be done within a few seconds
blanchet
parents:
43051
diff
changeset
|
919 |
(preplay, proof_banner mode name, used_facts, |
45561
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
920 |
choose_minimize_command params minimize_command name preplay, |
43052
8d6a4978cc65
automatically minimize with Metis when this can be done within a few seconds
blanchet
parents:
43051
diff
changeset
|
921 |
subgoal, subgoal_count) |
48799 | 922 |
val num_chained = length (#facts (Proof.goal state)) |
923 |
in |
|
49918
cf441f4a358b
renamed Isar-proof related options + changed semantics of Isar shrinking
blanchet
parents:
49914
diff
changeset
|
924 |
proof_text ctxt isar_proofs isar_params num_chained |
48799 | 925 |
one_line_params |
926 |
end, |
|
43261
a4aeb26a6362
make sure that the message tail (timing + TPTP important message) is preserved upon automatic minimization
blanchet
parents:
43259
diff
changeset
|
927 |
(if verbose then |
45381 | 928 |
"\nATP real CPU time: " ^ string_from_time run_time ^ "." |
43261
a4aeb26a6362
make sure that the message tail (timing + TPTP important message) is preserved upon automatic minimization
blanchet
parents:
43259
diff
changeset
|
929 |
else |
a4aeb26a6362
make sure that the message tail (timing + TPTP important message) is preserved upon automatic minimization
blanchet
parents:
43259
diff
changeset
|
930 |
"") ^ |
a4aeb26a6362
make sure that the message tail (timing + TPTP important message) is preserved upon automatic minimization
blanchet
parents:
43259
diff
changeset
|
931 |
(if important_message <> "" then |
a4aeb26a6362
make sure that the message tail (timing + TPTP important message) is preserved upon automatic minimization
blanchet
parents:
43259
diff
changeset
|
932 |
"\n\nImportant message from Dr. Geoff Sutcliffe:\n" ^ |
a4aeb26a6362
make sure that the message tail (timing + TPTP important message) is preserved upon automatic minimization
blanchet
parents:
43259
diff
changeset
|
933 |
important_message |
a4aeb26a6362
make sure that the message tail (timing + TPTP important message) is preserved upon automatic minimization
blanchet
parents:
43259
diff
changeset
|
934 |
else |
a4aeb26a6362
make sure that the message tail (timing + TPTP important message) is preserved upon automatic minimization
blanchet
parents:
43259
diff
changeset
|
935 |
"")) |
43033 | 936 |
end |
43052
8d6a4978cc65
automatically minimize with Metis when this can be done within a few seconds
blanchet
parents:
43051
diff
changeset
|
937 |
| SOME failure => |
50669
84c7cf36b2e0
use "Lazy" to simplify control flow a bit and guarantee single evaluation (at most)
blanchet
parents:
50667
diff
changeset
|
938 |
([], Lazy.value (Failed_to_Play plain_metis), |
45519
cd6e78cb6ee8
make metis reconstruction handling more flexible
blanchet
parents:
45514
diff
changeset
|
939 |
fn _ => string_for_failure failure, "") |
38023 | 940 |
in |
51013 | 941 |
{outcome = outcome, used_facts = used_facts, used_from = used_from, |
51009
e8ff34a1fa9a
thread through fact triple component from which used facts come, for accurate index output
blanchet
parents:
51007
diff
changeset
|
942 |
run_time = run_time, preplay = preplay, message = message, |
e8ff34a1fa9a
thread through fact triple component from which used facts come, for accurate index output
blanchet
parents:
51007
diff
changeset
|
943 |
message_tail = message_tail} |
38023 | 944 |
end |
945 |
||
51014 | 946 |
(* Moves the first element of a list to its end, e.g. [a, b, c] becomes
   [b, c, a]. The empty list is returned unchanged, which makes the function
   total (no "Match" exception, no non-exhaustiveness warning). *)
fun rotate_one [] = []
  | rotate_one (x :: xs) = xs @ [x]
947 |
||
40669 | 948 |
(* "SMT_Failure.Abnormal_Termination" carries the solver's return code. Until |
949 |
these are sorted out properly in the SMT module, we have to interpret these |
|
950 |
ourselves. *) |
|
40684
c7ba327eb58c
more precise error handling in Sledgehammer/SMT for Z3 and remote SMT provers
blanchet
parents:
40669
diff
changeset
|
951 |
val remote_smt_failures = |
43631
4144d7b4ec77
enforce hard timeout on ATPs (esp. "z3_atp" on Linux) + remove obsolete failure codes
blanchet
parents:
43626
diff
changeset
|
952 |
[(2, NoLibwwwPerl), |
4144d7b4ec77
enforce hard timeout on ATPs (esp. "z3_atp" on Linux) + remove obsolete failure codes
blanchet
parents:
43626
diff
changeset
|
953 |
(22, CantConnect)] |
40684
c7ba327eb58c
more precise error handling in Sledgehammer/SMT for Z3 and remote SMT provers
blanchet
parents:
40669
diff
changeset
|
954 |
val z3_failures = |
41236 | 955 |
[(101, OutOfResources), |
956 |
(103, MalformedInput), |
|
50667 | 957 |
(110, MalformedInput), |
958 |
(112, TimedOut)] |
|
40684
c7ba327eb58c
more precise error handling in Sledgehammer/SMT for Z3 and remote SMT provers
blanchet
parents:
40669
diff
changeset
|
959 |
val unix_failures = |
48797 | 960 |
[(138, Crashed), |
961 |
(139, Crashed)] |
|
43631
4144d7b4ec77
enforce hard timeout on ATPs (esp. "z3_atp" on Linux) + remove obsolete failure codes
blanchet
parents:
43626
diff
changeset
|
962 |
(* Single association list of (exit code, failure) pairs for all SMT back
   ends, in the order: remote solvers, Z3, generic Unix codes. *)
val smt_failures =
  List.concat [remote_smt_failures, z3_failures, unix_failures]
40555 | 963 |
|
42100
062381c5f9f8
more precise failure reporting in Sledgehammer/SMT
blanchet
parents:
42061
diff
changeset
|
964 |
fun failure_from_smt_failure (SMT_Failure.Counterexample {is_real_cex, ...}) = |
43050
59284a13abc4
support "metis" and "metisFT" as provers in the architecture, so they can be used for minimizing
blanchet
parents:
43044
diff
changeset
|
965 |
if is_real_cex then Unprovable else GaveUp |
41222 | 966 |
| failure_from_smt_failure SMT_Failure.Time_Out = TimedOut |
967 |
| failure_from_smt_failure (SMT_Failure.Abnormal_Termination code) = |
|
968 |
(case AList.lookup (op =) smt_failures code of |
|
40684
c7ba327eb58c
more precise error handling in Sledgehammer/SMT for Z3 and remote SMT provers
blanchet
parents:
40669
diff
changeset
|
969 |
SOME failure => failure |
41259
13972ced98d9
more precise error messages in "verbose" (or "debug") mode, following this morning's permission debacle
blanchet
parents:
41256
diff
changeset
|
970 |
| NONE => UnknownError ("Abnormal termination with exit code " ^ |
13972ced98d9
more precise error messages in "verbose" (or "debug") mode, following this morning's permission debacle
blanchet
parents:
41256
diff
changeset
|
971 |
string_of_int code ^ ".")) |
41222 | 972 |
| failure_from_smt_failure SMT_Failure.Out_Of_Memory = OutOfResources |
973 |
| failure_from_smt_failure (SMT_Failure.Other_Failure msg) = |
|
42061
71077681eaf6
let SMT errors through -- the main reason for keeping them quiet was that the SMT bridge used to suffer from internal bugs, but these have been fixed for some time now
blanchet
parents:
42060
diff
changeset
|
974 |
UnknownError msg |
40063
d086e3699e78
bring ATPs and SMT solvers more in line with each other
blanchet
parents:
40062
diff
changeset
|
975 |
|
40698 | 976 |
(* FUDGE *) |
42646
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
977 |
val smt_max_slices = |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
978 |
Attrib.setup_config_int @{binding sledgehammer_smt_max_slices} (K 8) |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
979 |
val smt_slice_fact_frac = |
51014 | 980 |
Attrib.setup_config_real @{binding sledgehammer_smt_slice_fact_frac} |
981 |
(K 0.667) |
|
42646
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
982 |
val smt_slice_time_frac = |
51014 | 983 |
Attrib.setup_config_real @{binding sledgehammer_smt_slice_time_frac} (K 0.333) |
42646
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
984 |
val smt_slice_min_secs = |
51014 | 985 |
Attrib.setup_config_int @{binding sledgehammer_smt_slice_min_secs} (K 3) |
40409
3642dc3b72e8
invoke SMT solver in a loop, with fewer and fewer facts, in case of error
blanchet
parents:
40370
diff
changeset
|
986 |
|
50759 | 987 |
fun smt_filter_loop name |
42724
4d6bcf846759
added "max_mono_instances" option to Sledgehammer and renamed old "monomorphize_limit" option
blanchet
parents:
42723
diff
changeset
|
988 |
({debug, verbose, overlord, max_mono_iters, |
45706 | 989 |
max_new_mono_instances, timeout, slice, ...} : params) |
50486
d5dc28fafd9d
made MaSh evaluation driver work with SMT solvers
blanchet
parents:
50020
diff
changeset
|
990 |
state goal i = |
40409
3642dc3b72e8
invoke SMT solver in a loop, with fewer and fewer facts, in case of error
blanchet
parents:
40370
diff
changeset
|
991 |
let |
50759 | 992 |
fun repair_context ctxt = |
993 |
ctxt |> select_smt_solver name |
|
994 |
|> Config.put SMT_Config.verbose debug |
|
995 |
|> (if overlord then |
|
996 |
Config.put SMT_Config.debug_files |
|
997 |
(overlord_file_location_for_prover name |
|
998 |
|> (fn (path, name) => path ^ "/" ^ name)) |
|
999 |
else |
|
1000 |
I) |
|
1001 |
|> Config.put SMT_Config.infer_triggers |
|
1002 |
(Config.get ctxt smt_triggers) |
|
1003 |
val ctxt = Proof.context_of state |> repair_context |
|
1004 |
val state = state |> Proof.map_context (K ctxt) |
|
45706 | 1005 |
val max_slices = if slice then Config.get ctxt smt_max_slices else 1 |
51024
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1006 |
fun do_slice timeout slice outcome0 time_so_far |
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1007 |
(weighted_factss as (fact_filter, weighted_facts) :: _) = |
40553
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1008 |
let |
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1009 |
val timer = Timer.startRealTimer () |
42724
4d6bcf846759
added "max_mono_instances" option to Sledgehammer and renamed old "monomorphize_limit" option
blanchet
parents:
42723
diff
changeset
|
1010 |
val state = |
4d6bcf846759
added "max_mono_instances" option to Sledgehammer and renamed old "monomorphize_limit" option
blanchet
parents:
42723
diff
changeset
|
1011 |
state |> Proof.map_context |
43267 | 1012 |
(repair_monomorph_context max_mono_iters |
47962
137883567114
lower the monomorphization thresholds for less scalable provers
blanchet
parents:
47946
diff
changeset
|
1013 |
default_max_mono_iters max_new_mono_instances |
137883567114
lower the monomorphization thresholds for less scalable provers
blanchet
parents:
47946
diff
changeset
|
1014 |
default_max_new_mono_instances) |
42443
724e612ba248
implemented general slicing for ATPs, especially E 1.2w and above
blanchet
parents:
42361
diff
changeset
|
1015 |
val slice_timeout = |
50557 | 1016 |
if slice < max_slices andalso timeout <> NONE then |
1017 |
let val ms = timeout |> the |> Time.toMilliseconds in |
|
1018 |
Int.min (ms, |
|
1019 |
Int.max (1000 * Config.get ctxt smt_slice_min_secs, |
|
1020 |
Real.ceil (Config.get ctxt smt_slice_time_frac |
|
1021 |
* Real.fromInt ms))) |
|
1022 |
|> Time.fromMilliseconds |> SOME |
|
1023 |
end |
|
40553
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1024 |
else |
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1025 |
timeout |
51009
e8ff34a1fa9a
thread through fact triple component from which used facts come, for accurate index output
blanchet
parents:
51007
diff
changeset
|
1026 |
val num_facts = length weighted_facts |
40553
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1027 |
val _ = |
42614
81953e554197
make "debug" more verbose and "verbose" less verbose
blanchet
parents:
42613
diff
changeset
|
1028 |
if debug then |
81953e554197
make "debug" more verbose and "verbose" less verbose
blanchet
parents:
42613
diff
changeset
|
1029 |
quote name ^ " slice " ^ string_of_int slice ^ " with " ^ |
50557 | 1030 |
string_of_int num_facts ^ " fact" ^ plural_s num_facts ^ |
1031 |
(case slice_timeout of |
|
1032 |
SOME timeout => " for " ^ string_from_time timeout |
|
1033 |
| NONE => "") ^ "..." |
|
40553
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1034 |
|> Output.urgent_message |
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1035 |
else |
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1036 |
() |
41168 | 1037 |
val birth = Timer.checkRealTimer timer |
41171 | 1038 |
val _ = |
41211
1e2e16bc0077
no need to do a super-duper atomization if Metis fails afterwards anyway
blanchet
parents:
41209
diff
changeset
|
1039 |
if debug then Output.urgent_message "Invoking SMT solver..." else () |
50486
d5dc28fafd9d
made MaSh evaluation driver work with SMT solvers
blanchet
parents:
50020
diff
changeset
|
1040 |
val state_facts = these (try (#facts o Proof.goal) state) |
41209 | 1041 |
val (outcome, used_facts) = |
51009
e8ff34a1fa9a
thread through fact triple component from which used facts come, for accurate index output
blanchet
parents:
51007
diff
changeset
|
1042 |
SMT_Solver.smt_filter_preprocess ctxt state_facts goal weighted_facts |
e8ff34a1fa9a
thread through fact triple component from which used facts come, for accurate index output
blanchet
parents:
51007
diff
changeset
|
1043 |
i |
50557 | 1044 |
|> SMT_Solver.smt_filter_apply (slice_timeout |> the_default one_day) |
41239 | 1045 |
|> (fn {outcome, used_facts} => (outcome, used_facts)) |
41209 | 1046 |
handle exn => if Exn.is_interrupt exn then |
1047 |
reraise exn |
|
1048 |
else |
|
42061
71077681eaf6
let SMT errors through -- the main reason for keeping them quiet was that the SMT bridge used to suffer from internal bugs, but these have been fixed for some time now
blanchet
parents:
42060
diff
changeset
|
1049 |
(ML_Compiler.exn_message exn |
41209 | 1050 |
|> SMT_Failure.Other_Failure |> SOME, []) |
41168 | 1051 |
val death = Timer.checkRealTimer timer |
40553
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1052 |
val outcome0 = if is_none outcome0 then SOME outcome else outcome0 |
41168 | 1053 |
val time_so_far = Time.+ (time_so_far, Time.- (death, birth)) |
40553
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1054 |
val too_many_facts_perhaps = |
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1055 |
case outcome of |
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1056 |
NONE => false |
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1057 |
| SOME (SMT_Failure.Counterexample _) => false |
42443
724e612ba248
implemented general slicing for ATPs, especially E 1.2w and above
blanchet
parents:
42361
diff
changeset
|
1058 |
| SOME SMT_Failure.Time_Out => slice_timeout <> timeout |
42614
81953e554197
make "debug" more verbose and "verbose" less verbose
blanchet
parents:
42613
diff
changeset
|
1059 |
| SOME (SMT_Failure.Abnormal_Termination _) => true (* kind of *) |
40553
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1060 |
| SOME SMT_Failure.Out_Of_Memory => true |
41211
1e2e16bc0077
no need to do a super-duper atomization if Metis fails afterwards anyway
blanchet
parents:
41209
diff
changeset
|
1061 |
| SOME (SMT_Failure.Other_Failure _) => true |
50557 | 1062 |
val timeout = |
1063 |
Option.map |
|
1064 |
(fn timeout => Time.- (timeout, Timer.checkRealTimer timer)) |
|
1065 |
timeout |
|
40553
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1066 |
in |
42443
724e612ba248
implemented general slicing for ATPs, especially E 1.2w and above
blanchet
parents:
42361
diff
changeset
|
1067 |
if too_many_facts_perhaps andalso slice < max_slices andalso |
50557 | 1068 |
num_facts > 0 andalso |
1069 |
(timeout = NONE orelse Time.> (the timeout, Time.zeroTime)) then |
|
41169 | 1070 |
let |
42614
81953e554197
make "debug" more verbose and "verbose" less verbose
blanchet
parents:
42613
diff
changeset
|
1071 |
val new_num_facts = |
42646
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
1072 |
Real.ceil (Config.get ctxt smt_slice_fact_frac |
4781fcd53572
replaced some Unsynchronized.refs with Config.Ts
blanchet
parents:
42642
diff
changeset
|
1073 |
* Real.fromInt num_facts) |
51024
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1074 |
val weighted_factss as (new_fact_filter, _) :: _ = |
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1075 |
weighted_factss |
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1076 |
|> rotate_one |
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1077 |
|> app_hd (apsnd (take new_num_facts)) |
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1078 |
val show_filter = fact_filter <> new_fact_filter |
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1079 |
fun num_of_facts fact_filter num_facts = |
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1080 |
string_of_int num_facts ^ |
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1081 |
(if show_filter then " " ^ quote fact_filter else "") ^ |
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1082 |
" fact" ^ plural_s num_facts |
42614
81953e554197
make "debug" more verbose and "verbose" less verbose
blanchet
parents:
42613
diff
changeset
|
1083 |
val _ = |
81953e554197
make "debug" more verbose and "verbose" less verbose
blanchet
parents:
42613
diff
changeset
|
1084 |
if verbose andalso is_some outcome then |
51024
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1085 |
quote name ^ " invoked with " ^ |
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1086 |
num_of_facts fact_filter num_facts ^ ": " ^ |
42614
81953e554197
make "debug" more verbose and "verbose" less verbose
blanchet
parents:
42613
diff
changeset
|
1087 |
string_for_failure (failure_from_smt_failure (the outcome)) ^ |
51024
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1088 |
" Retrying with " ^ num_of_facts new_fact_filter new_num_facts ^ |
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1089 |
"..." |
42614
81953e554197
make "debug" more verbose and "verbose" less verbose
blanchet
parents:
42613
diff
changeset
|
1090 |
|> Output.urgent_message |
81953e554197
make "debug" more verbose and "verbose" less verbose
blanchet
parents:
42613
diff
changeset
|
1091 |
else |
81953e554197
make "debug" more verbose and "verbose" less verbose
blanchet
parents:
42613
diff
changeset
|
1092 |
() |
42443
724e612ba248
implemented general slicing for ATPs, especially E 1.2w and above
blanchet
parents:
42361
diff
changeset
|
1093 |
in |
51024
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1094 |
do_slice timeout (slice + 1) outcome0 time_so_far weighted_factss |
42443
724e612ba248
implemented general slicing for ATPs, especially E 1.2w and above
blanchet
parents:
42361
diff
changeset
|
1095 |
end |
40553
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1096 |
else |
1264c9172338
pick up SMT solver crashes and report them to the user/Mirabelle if desired
blanchet
parents:
40471
diff
changeset
|
1097 |
{outcome = if is_none outcome then NONE else the outcome0, |
51009
e8ff34a1fa9a
thread through fact triple component from which used facts come, for accurate index output
blanchet
parents:
51007
diff
changeset
|
1098 |
used_facts = used_facts, used_from = map (apsnd snd) weighted_facts, |
e8ff34a1fa9a
thread through fact triple component from which used facts come, for accurate index output
blanchet
parents:
51007
diff
changeset
|
1099 |
run_time = time_so_far} |
40409
3642dc3b72e8
invoke SMT solver in a loop, with fewer and fewer facts, in case of error
blanchet
parents:
40370
diff
changeset
|
1100 |
end |
42443
724e612ba248
implemented general slicing for ATPs, especially E 1.2w and above
blanchet
parents:
42361
diff
changeset
|
1101 |
in do_slice timeout 1 NONE Time.zeroTime end |
40409
3642dc3b72e8
invoke SMT solver in a loop, with fewer and fewer facts, in case of error
blanchet
parents:
40370
diff
changeset
|
1102 |
|
43052
8d6a4978cc65
automatically minimize with Metis when this can be done within a few seconds
blanchet
parents:
43051
diff
changeset
|
1103 |
fun run_smt_solver mode name (params as {debug, verbose, preplay_timeout, ...}) |
43011
5f8d74d3b297
added syntax for specifying Metis timeout (currently used only by SMT solvers)
blanchet
parents:
43006
diff
changeset
|
1104 |
minimize_command |
51014 | 1105 |
({state, goal, subgoal, subgoal_count, factss, ...} : prover_problem) = |
36379
20ef039bccff
make "ATP_Manager.get_prover" a total function, since we always want to show the same error text
blanchet
parents:
36373
diff
changeset
|
1106 |
let |
41242
8edeb1dbbc76
run the SMT relevance filter only once, then run the normalization/monomorphization code once _per class_ of SMT solvers
blanchet
parents:
41241
diff
changeset
|
1107 |
val ctxt = Proof.context_of state |
51014 | 1108 |
fun weight_facts facts = |
1109 |
let val num_facts = length facts in |
|
1110 |
facts ~~ (0 upto num_facts - 1) |
|
1111 |
|> map (weight_smt_fact ctxt num_facts) |
|
1112 |
end |
|
51024
98fb341d32e3
distinguish MeSh and smart -- with smart, allow combinations of MaSh, MeSh, and MePo in different slices -- and use MaSh also with SMT solvers, based on evaluation
blanchet
parents:
51014
diff
changeset
|
1113 |
val weighted_factss = factss |> map (apsnd weight_facts) |
51009
e8ff34a1fa9a
thread through fact triple component from which used facts come, for accurate index output
blanchet
parents:
51007
diff
changeset
|
1114 |
val {outcome, used_facts = used_pairs, used_from, run_time} = |
51014 | 1115 |
smt_filter_loop name params state goal subgoal weighted_factss |
45781
fc2c368b5f54
use same order of facts for preplay as for actual reconstruction -- Metis sometimes exhibits very different timings depending on the order of the facts
blanchet
parents:
45707
diff
changeset
|
1116 |
val used_facts = used_pairs |> map fst |
41222 | 1117 |
val outcome = outcome |> Option.map failure_from_smt_failure |
43261
a4aeb26a6362
make sure that the message tail (timing + TPTP important message) is preserved upon automatic minimization
blanchet
parents:
43259
diff
changeset
|
1118 |
val (preplay, message, message_tail) = |
40184
91b4b73dbafb
proper error handling for SMT solvers in Sledgehammer
blanchet
parents:
40181
diff
changeset
|
1119 |
case outcome of |
91b4b73dbafb
proper error handling for SMT solvers in Sledgehammer
blanchet
parents:
40181
diff
changeset
|
1120 |
NONE => |
50669
84c7cf36b2e0
use "Lazy" to simplify control flow a bit and guarantee single evaluation (at most)
blanchet
parents:
50667
diff
changeset
|
1121 |
(Lazy.lazy (fn () => |
84c7cf36b2e0
use "Lazy" to simplify control flow a bit and guarantee single evaluation (at most)
blanchet
parents:
50667
diff
changeset
|
1122 |
play_one_line_proof mode debug verbose preplay_timeout used_pairs |
84c7cf36b2e0
use "Lazy" to simplify control flow a bit and guarantee single evaluation (at most)
blanchet
parents:
50667
diff
changeset
|
1123 |
state subgoal SMT |
84c7cf36b2e0
use "Lazy" to simplify control flow a bit and guarantee single evaluation (at most)
blanchet
parents:
50667
diff
changeset
|
1124 |
(bunch_of_reconstructors false (fn desperate => |
84c7cf36b2e0
use "Lazy" to simplify control flow a bit and guarantee single evaluation (at most)
blanchet
parents:
50667
diff
changeset
|
1125 |
if desperate then liftingN else metis_default_lam_trans))), |
43052
8d6a4978cc65
automatically minimize with Metis when this can be done within a few seconds
blanchet
parents:
43051
diff
changeset
|
1126 |
fn preplay => |
8d6a4978cc65
automatically minimize with Metis when this can be done within a few seconds
blanchet
parents:
43051
diff
changeset
|
1127 |
let |
8d6a4978cc65
automatically minimize with Metis when this can be done within a few seconds
blanchet
parents:
43051
diff
changeset
|
1128 |
val one_line_params = |
8d6a4978cc65
automatically minimize with Metis when this can be done within a few seconds
blanchet
parents:
43051
diff
changeset
|
1129 |
(preplay, proof_banner mode name, used_facts, |
45561
57227eedce81
don't propagate user-set "type_enc" or "lam_trans" to Metis calls
blanchet
parents:
45560
diff
changeset
|
1130 |
choose_minimize_command params minimize_command name preplay, |
43052
8d6a4978cc65
automatically minimize with Metis when this can be done within a few seconds
blanchet
parents:
43051
diff
changeset
|
1131 |
subgoal, subgoal_count) |
48799 | 1132 |
val num_chained = length (#facts (Proof.goal state)) |
1133 |
in one_line_proof_text num_chained one_line_params end, |
|
43261
a4aeb26a6362
make sure that the message tail (timing + TPTP important message) is preserved upon automatic minimization
blanchet
parents:
43259
diff
changeset
|
1134 |
if verbose then |
45370
bab52dafa63a
use "Time.time" rather than milliseconds internally
blanchet
parents:
45369
diff
changeset
|
1135 |
"\nSMT solver real CPU time: " ^ string_from_time run_time ^ "." |
43261
a4aeb26a6362
make sure that the message tail (timing + TPTP important message) is preserved upon automatic minimization
blanchet
parents:
43259
diff
changeset
|
1136 |
else |
a4aeb26a6362
make sure that the message tail (timing + TPTP important message) is preserved upon automatic minimization
blanchet
parents:
43259
diff
changeset
|
1137 |
"") |
43166 | 1138 |
| SOME failure => |
50669
84c7cf36b2e0
use "Lazy" to simplify control flow a bit and guarantee single evaluation (at most)
blanchet
parents:
50667
diff
changeset
|
1139 |
(Lazy.value (Failed_to_Play plain_metis), |
84c7cf36b2e0
use "Lazy" to simplify control flow a bit and guarantee single evaluation (at most)
blanchet
parents:
50667
diff
changeset
|
1140 |
fn _ => string_for_failure failure, "") |
40063
d086e3699e78
bring ATPs and SMT solvers more in line with each other
blanchet
parents:
40062
diff
changeset
|
1141 |
in |
51009
e8ff34a1fa9a
thread through fact triple component from which used facts come, for accurate index output
blanchet
parents:
51007
diff
changeset
|
1142 |
{outcome = outcome, used_facts = used_facts, used_from = used_from, |
e8ff34a1fa9a
thread through fact triple component from which used facts come, for accurate index output
blanchet
parents:
51007
diff
changeset
|
1143 |
run_time = run_time, preplay = preplay, message = message, |
e8ff34a1fa9a
thread through fact triple component from which used facts come, for accurate index output
blanchet
parents:
51007
diff
changeset
|
1144 |
message_tail = message_tail} |
40063
d086e3699e78
bring ATPs and SMT solvers more in line with each other
blanchet
parents:
40062
diff
changeset
|
1145 |
end |
d086e3699e78
bring ATPs and SMT solvers more in line with each other
blanchet
parents:
40062
diff
changeset
|
1146 |
|
45520 | 1147 |
(* Runs the proof reconstructor called "name" (either metisN or smtN) on the
   facts of the first entry of "factss" and packages the outcome as a prover
   result record.

   - mode, name: forwarded to "proof_banner"; "name" also selects the
     reconstructor. Any other name raises Fail "unknown reconstructor: ...".
   - params: "debug", "verbose" and "timeout" are handed to
     "play_one_line_proof"; "type_enc" and "lam_trans" configure Metis, with
     defaults substituted when they are NONE.
   - minimize_command: applied to the override parameters and "name" when the
     success message is built.
   - problem: only "state", "subgoal", "subgoal_count" and the head of
     "factss" are read. The pattern does not cover an empty "factss". *)
fun run_reconstructor mode name
        (params as {debug, verbose, timeout, type_enc, lam_trans, ...})
        minimize_command
        ({state, subgoal, subgoal_count, factss = (_, facts) :: _, ...}
         : prover_problem) =
  let
    val reconstr =
      if name = metisN then
        Metis (the_default (hd partial_type_encs) type_enc,
               the_default metis_default_lam_trans lam_trans)
      else if name = smtN then
        SMT
      else
        raise Fail ("unknown reconstructor: " ^ quote name)
    val fact_names = map fst facts
    (* Minimize mode is replayed as Normal; every other mode is kept. *)
    val play_mode = if mode = Minimize then Normal else mode
    (* Builds the one-line proof text for whichever play result the caller
       eventually supplies (not necessarily the one obtained below). *)
    fun success_message some_play =
      let
        val (_, override_params) = extract_reconstructor params reconstr
        val banner = proof_banner mode name
        val command = minimize_command override_params name
        val num_chained = length (#facts (Proof.goal state))
      in
        one_line_proof_text num_chained
          (some_play, banner, fact_names, command, subgoal, subgoal_count)
      end
    (* Failed_to_Play is reported as GaveUp; any other non-Played result is
       reported as TimedOut. *)
    fun failure_result unplayed =
      let
        val failure =
          (case unplayed of
            Failed_to_Play _ => GaveUp
          | _ => TimedOut)
      in
        {outcome = SOME failure, used_facts = [], used_from = [],
         run_time = Time.zeroTime, preplay = Lazy.value unplayed,
         message = fn _ => string_for_failure failure, message_tail = ""}
      end
  in
    (case play_one_line_proof play_mode debug verbose timeout facts state
            subgoal reconstr [reconstr] of
      played as Played (_, time) =>
        {outcome = NONE, used_facts = fact_names, used_from = facts,
         run_time = time, preplay = Lazy.value played,
         message = success_message, message_tail = ""}
    | unplayed => failure_result unplayed)
  end
59284a13abc4
support "metis" and "metisFT" as provers in the architecture, so they can be used for minimizing
blanchet
parents:
43044
diff
changeset
|
1189 |
|
43021 | 1190 |
(* Selects the prover implementation for "name". The checks run in this
   order: reconstructor, ATP known to the theory of "ctxt", SMT prover known
   to "ctxt". If none of them matches, "error" is called with a
   "No such prover" message. *)
fun get_prover ctxt mode name =
  let
    val thy = Proof_Context.theory_of ctxt
    (* Delayed so that the ATP/SMT lookups only run for non-reconstructors. *)
    fun atp_or_smt_prover () =
      if is_atp thy name then
        run_atp mode name (get_atp thy name ())
      else if is_smt_prover ctxt name then
        run_smt_solver mode name
      else
        error ("No such prover: " ^ name ^ ".")
  in
    if is_reconstructor name then run_reconstructor mode name
    else atp_or_smt_prover ()
  end
40063
d086e3699e78
bring ATPs and SMT solvers more in line with each other
blanchet
parents:
40062
diff
changeset
|
1197 |
|
28582 | 1198 |
end; |