author  blanchet 
Wed, 18 Jul 2012 08:44:04 +0200  
changeset 48326  ef800e91d072 
parent 48325  2ec05ef3e593 
child 48327  568b3193e53e 
permissions  rwrr 
48248  1 
(* Title: HOL/Tools/Sledgehammer/sledgehammer_filter_mash.ML 
2 
Author: Jasmin Blanchette, TU Muenchen 

3 

4 
Sledgehammer's machinelearningbased relevance filter (MaSh). 

5 
*) 

6 

7 
signature SLEDGEHAMMER_FILTER_MASH = 

8 
sig 

48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

9 
type status = ATP_Problem_Generate.status 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

10 
type stature = ATP_Problem_Generate.stature 
48296
e7f01b7e244e
gracefully handle the case of empty theories when going up the accessibility chain
blanchet
parents:
48293
diff
changeset

11 
type fact = Sledgehammer_Fact.fact 
e7f01b7e244e
gracefully handle the case of empty theories when going up the accessibility chain
blanchet
parents:
48293
diff
changeset

12 
type fact_override = Sledgehammer_Fact.fact_override 
48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

13 
type params = Sledgehammer_Provers.params 
48288
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48251
diff
changeset

14 
type relevance_fudge = Sledgehammer_Provers.relevance_fudge 
48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

15 
type prover_result = Sledgehammer_Provers.prover_result 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

16 

48308  17 
val trace : bool Config.T 
48319
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

18 
val MaShN : string 
48314
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

19 
val meshN : string 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

20 
val iterN : string 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

21 
val mashN : string 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

22 
val fact_filters : string list 
48303
f1d135d0ea69
improved MaSh string escaping and make more operations stringbased
blanchet
parents:
48302
diff
changeset

23 
val escape_meta : string > string 
f1d135d0ea69
improved MaSh string escaping and make more operations stringbased
blanchet
parents:
48302
diff
changeset

24 
val escape_metas : string list > string 
48308  25 
val unescape_meta : string > string 
26 
val unescape_metas : string > string list 

48311  27 
val extract_query : string > string * string list 
48321  28 
val suggested_facts : string list > ('a * thm) list > ('a * thm) list 
29 
val mesh_facts : 

30 
int > (('a * thm) list * ('a * thm) list) list > ('a * thm) list 

48324  31 
val is_likely_tautology_or_too_meta : thm > bool 
48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

32 
val theory_ord : theory * theory > order 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

33 
val thm_ord : thm * thm > order 
48318  34 
val features_of : 
35 
Proof.context > string > theory > status > term list > string list 

48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

36 
val isabelle_dependencies_of : unit Symtab.table > thm > string list 
48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

37 
val goal_of_thm : theory > thm > thm 
48321  38 
val run_prover_for_mash : 
48318  39 
Proof.context > params > string > fact list > thm > prover_result 
48308  40 
val mash_RESET : Proof.context > unit 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

41 
val mash_INIT : 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

42 
Proof.context > bool 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

43 
> (string * string list * string list * string list) list > unit 
48308  44 
val mash_ADD : 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

45 
Proof.context > bool 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

46 
> (string * string list * string list * string list) list > unit 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

47 
val mash_QUERY : 
48318  48 
Proof.context > bool > int > string list * string list > string list 
48308  49 
val mash_reset : Proof.context > unit 
48318  50 
val mash_could_suggest_facts : unit > bool 
48321  51 
val mash_can_suggest_facts : Proof.context > bool 
48298  52 
val mash_suggest_facts : 
48321  53 
Proof.context > params > string > int > term list > term 
54 
> ('a * thm) list > ('a * thm) list * ('a * thm) list 

48319
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

55 
val mash_learn_thy : 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

56 
Proof.context > params > theory > Time.time > fact list > string 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

57 
val mash_learn_proof : 
48321  58 
Proof.context > params > term > ('a * thm) list > thm list > unit 
48288
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48251
diff
changeset

59 
val relevant_facts : 
48292  60 
Proof.context > params > string > int > fact_override > term list 
48296
e7f01b7e244e
gracefully handle the case of empty theories when going up the accessibility chain
blanchet
parents:
48293
diff
changeset

61 
> term > fact list > fact list 
48319
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

62 
val kill_learners : unit > unit 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

63 
val running_learners : unit > unit 
48248  64 
end; 
65 

66 
structure Sledgehammer_Filter_MaSh : SLEDGEHAMMER_FILTER_MASH = 

67 
struct 

48249  68 

48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

69 
open ATP_Util 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

70 
open ATP_Problem_Generate 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

71 
open Sledgehammer_Util 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

72 
open Sledgehammer_Fact 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

73 
open Sledgehammer_Filter_Iter 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

74 
open Sledgehammer_Provers 
48318  75 
open Sledgehammer_Minimize 
48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

76 

48308  77 
val trace = 
78 
Attrib.setup_config_bool @{binding sledgehammer_filter_mash_trace} (K false) 

79 
fun trace_msg ctxt msg = if Config.get ctxt trace then tracing (msg ()) else () 

80 

48319
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

81 
val MaShN = "MaSh" 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

82 

48314
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

83 
val meshN = "mesh" 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

84 
val iterN = "iter" 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

85 
val mashN = "mash" 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

86 

ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

87 
val fact_filters = [meshN, iterN, mashN] 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

88 

ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

89 
fun mash_home () = getenv "MASH_HOME" 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

90 
fun mash_state_dir () = 
48309  91 
getenv "ISABELLE_HOME_USER" ^ "/mash" 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

92 
> tap (Isabelle_System.mkdir o Path.explode) 
48314
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

93 
fun mash_state_path () = mash_state_dir () ^ "/state" > Path.explode 
48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

94 

6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

95 
(*** Isabelle helpers ***) 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

96 

48308  97 
fun meta_char c = 
48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

98 
if Char.isAlphaNum c orelse c = #"_" orelse c = #"." orelse c = #"(" orelse 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

99 
c = #")" orelse c = #"," then 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

100 
String.str c 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

101 
else 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

102 
(* fixed width, in case more digits follow *) 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

103 
"\\" ^ stringN_of_int 3 (Char.ord c) 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

104 

48308  105 
fun unmeta_chars accum [] = String.implode (rev accum) 
106 
 unmeta_chars accum (#"\\" :: d1 :: d2 :: d3 :: cs) = 

107 
(case Int.fromString (String.implode [d1, d2, d3]) of 

108 
SOME n => unmeta_chars (Char.chr n :: accum) cs 

109 
 NONE => "" (* error *)) 

110 
 unmeta_chars _ (#"\\" :: _) = "" (* error *) 

111 
 unmeta_chars accum (c :: cs) = unmeta_chars (c :: accum) cs 

112 

113 
val escape_meta = String.translate meta_char 

48303
f1d135d0ea69
improved MaSh string escaping and make more operations stringbased
blanchet
parents:
48302
diff
changeset

114 
val escape_metas = map escape_meta #> space_implode " " 
48315
82d6e46c673f
fixed order of accessibles + other tweaks to MaSh
blanchet
parents:
48314
diff
changeset

115 
val unescape_meta = String.explode #> unmeta_chars [] 
82d6e46c673f
fixed order of accessibles + other tweaks to MaSh
blanchet
parents:
48314
diff
changeset

116 
val unescape_metas = 
82d6e46c673f
fixed order of accessibles + other tweaks to MaSh
blanchet
parents:
48314
diff
changeset

117 
space_explode " " #> filter_out (curry (op =) "") #> map unescape_meta 
48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

118 

48311  119 
fun extract_query line = 
120 
case space_explode ":" line of 

48315
82d6e46c673f
fixed order of accessibles + other tweaks to MaSh
blanchet
parents:
48314
diff
changeset

121 
[goal_name, suggs] => (unescape_meta goal_name, unescape_metas suggs) 
48312  122 
 _ => ("", []) 
48311  123 

124 
fun find_suggested facts sugg = 

125 
find_first (fn (_, th) => Thm.get_name_hint th = sugg) facts 

126 
fun suggested_facts suggs facts = map_filter (find_suggested facts) suggs 

127 

48320
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

128 
fun sum_avg _ [] = 1000000000 (* big number *) 
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

129 
 sum_avg n xs = fold (Integer.add o Integer.mult n) xs 0 div (length xs) 
48313
0faafdffa662
mesh facts by taking into consideration whether a fact is known to MeSh
blanchet
parents:
48312
diff
changeset

130 

48320
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

131 
fun mesh_facts max_facts [(selected, unknown)] = 
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

132 
take max_facts selected @ take (max_facts  length selected) unknown 
48314
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

133 
 mesh_facts max_facts mess = 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

134 
let 
48320
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

135 
val mess = mess > map (apfst (`length)) 
48314
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

136 
val n = length mess 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

137 
val fact_eq = Thm.eq_thm o pairself snd 
48320
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

138 
fun score_in fact ((sel_len, sels), unks) = 
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

139 
case find_index (curry fact_eq fact) sels of 
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

140 
~1 => (case find_index (curry fact_eq fact) unks of 
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

141 
~1 => SOME sel_len 
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

142 
 _ => NONE) 
48314
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

143 
 j => SOME j 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

144 
fun score_of fact = mess > map_filter (score_in fact) > sum_avg n 
48320
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

145 
val facts = fold (union fact_eq o take max_facts o snd o fst) mess [] 
48314
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

146 
in 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

147 
facts > map (`score_of) > sort (int_ord o pairself fst) > map snd 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

148 
> take max_facts 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

149 
end 
48312  150 

48303
f1d135d0ea69
improved MaSh string escaping and make more operations stringbased
blanchet
parents:
48302
diff
changeset

151 
val thy_feature_prefix = "y_" 
48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

152 

48303
f1d135d0ea69
improved MaSh string escaping and make more operations stringbased
blanchet
parents:
48302
diff
changeset

153 
val thy_feature_name_of = prefix thy_feature_prefix 
f1d135d0ea69
improved MaSh string escaping and make more operations stringbased
blanchet
parents:
48302
diff
changeset

154 
val const_name_of = prefix const_prefix 
f1d135d0ea69
improved MaSh string escaping and make more operations stringbased
blanchet
parents:
48302
diff
changeset

155 
val type_name_of = prefix type_const_prefix 
f1d135d0ea69
improved MaSh string escaping and make more operations stringbased
blanchet
parents:
48302
diff
changeset

156 
val class_name_of = prefix class_prefix 
48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

157 

48324  158 
fun is_likely_tautology_or_too_meta th = 
159 
let 

160 
val is_boring_const = member (op =) atp_widely_irrelevant_consts 

161 
fun is_boring_bool t = 

162 
not (exists_Const (not o is_boring_const o fst) t) orelse 

163 
exists_type (exists_subtype (curry (op =) @{typ prop})) t 

164 
fun is_boring_prop (@{const Trueprop} $ t) = is_boring_bool t 

165 
 is_boring_prop (@{const "==>"} $ t $ u) = 

166 
is_boring_prop t andalso is_boring_prop u 

167 
 is_boring_prop (Const (@{const_name all}, _) $ (Abs (_, _, t)) $ u) = 

168 
is_boring_prop t andalso is_boring_prop u 

169 
 is_boring_prop (Const (@{const_name "=="}, _) $ t $ u) = 

170 
is_boring_bool t andalso is_boring_bool u 

171 
 is_boring_prop _ = true 

172 
in 

173 
is_boring_prop (prop_of th) andalso not (Thm.eq_thm_prop (@{thm ext}, th)) 

174 
end 

175 

176 
fun theory_ord p = 

177 
if Theory.eq_thy p then 

178 
EQUAL 

179 
else if Theory.subthy p then 

180 
LESS 

181 
else if Theory.subthy (swap p) then 

182 
GREATER 

183 
else case int_ord (pairself (length o Theory.ancestors_of) p) of 

184 
EQUAL => string_ord (pairself Context.theory_name p) 

185 
 order => order 

186 

187 
val thm_ord = theory_ord o pairself theory_of_thm 

188 

48326  189 
val bad_types = [@{type_name prop}, @{type_name bool}, @{type_name fun}] 
190 

48318  191 
fun interesting_terms_types_and_classes ctxt prover term_max_depth 
192 
type_max_depth ts = 

48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

193 
let 
48318  194 
fun is_bad_const (x as (s, _)) args = 
195 
member (op =) atp_logical_consts s orelse 

196 
fst (is_built_in_const_for_prover ctxt prover x args) 

48304  197 
fun add_classes @{sort type} = I 
198 
 add_classes S = union (op =) (map class_name_of S) 

48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

199 
fun do_add_type (Type (s, Ts)) = 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

200 
(not (member (op =) bad_types s) ? insert (op =) (type_name_of s)) 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

201 
#> fold do_add_type Ts 
48304  202 
 do_add_type (TFree (_, S)) = add_classes S 
203 
 do_add_type (TVar (_, S)) = add_classes S 

48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

204 
fun add_type T = type_max_depth >= 0 ? do_add_type T 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

205 
fun mk_app s args = 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

206 
if member (op <>) args "" then s ^ "(" ^ space_implode "," args ^ ")" 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

207 
else s 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

208 
fun patternify ~1 _ = "" 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

209 
 patternify depth t = 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

210 
case strip_comb t of 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

211 
(Const (s, _), args) => 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

212 
mk_app (const_name_of s) (map (patternify (depth  1)) args) 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

213 
 _ => "" 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

214 
fun add_term_patterns ~1 _ = I 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

215 
 add_term_patterns depth t = 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

216 
insert (op =) (patternify depth t) 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

217 
#> add_term_patterns (depth  1) t 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

218 
val add_term = add_term_patterns term_max_depth 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

219 
fun add_patterns t = 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

220 
let val (head, args) = strip_comb t in 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

221 
(case head of 
48318  222 
Const (x as (_, T)) => 
223 
not (is_bad_const x args) ? (add_term t #> add_type T) 

48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

224 
 Free (_, T) => add_type T 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

225 
 Var (_, T) => add_type T 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

226 
 Abs (_, T, body) => add_type T #> add_patterns body 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

227 
 _ => I) 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

228 
#> fold add_patterns args 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

229 
end 
48326  230 
in [] > fold add_patterns ts end 
48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

231 

6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

232 
fun is_exists (s, _) = (s = @{const_name Ex} orelse s = @{const_name Ex1}) 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

233 

48297  234 
val term_max_depth = 1 
235 
val type_max_depth = 1 

48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

236 

6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

237 
(* TODO: Generate type classes for types? *) 
48318  238 
fun features_of ctxt prover thy status ts = 
48303
f1d135d0ea69
improved MaSh string escaping and make more operations stringbased
blanchet
parents:
48302
diff
changeset

239 
thy_feature_name_of (Context.theory_name thy) :: 
48318  240 
interesting_terms_types_and_classes ctxt prover term_max_depth type_max_depth 
241 
ts 

48302  242 
> exists (not o is_lambda_free) ts ? cons "lambdas" 
243 
> exists (exists_Const is_exists) ts ? cons "skolems" 

244 
> (case status of 

245 
General => I 

246 
 Induction => cons "induction" 

247 
 Intro => cons "intro" 

248 
 Inductive => cons "inductive" 

249 
 Elim => cons "elim" 

250 
 Simp => cons "simp" 

251 
 Def => cons "def") 

48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

252 

48326  253 
fun isabelle_dependencies_of all_facts = thms_in_proof (SOME all_facts) 
48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

254 

6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

255 
val freezeT = Type.legacy_freeze_type 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

256 

6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

257 
fun freeze (t $ u) = freeze t $ freeze u 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

258 
 freeze (Abs (s, T, t)) = Abs (s, freezeT T, freeze t) 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

259 
 freeze (Var ((s, _), T)) = Free (s, freezeT T) 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

260 
 freeze (Const (s, T)) = Const (s, freezeT T) 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

261 
 freeze (Free (s, T)) = Free (s, freezeT T) 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

262 
 freeze t = t 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

263 

6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

264 
fun goal_of_thm thy = prop_of #> freeze #> cterm_of thy #> Goal.init 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

265 

48321  266 
fun run_prover_for_mash ctxt params prover facts goal = 
48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

267 
let 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

268 
val problem = 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

269 
{state = Proof.init ctxt, goal = goal, subgoal = 1, subgoal_count = 1, 
48289  270 
facts = facts > map (apfst (apfst (fn name => name ()))) 
48318  271 
> map Untranslated_Fact} 
48321  272 
val prover = get_minimizing_prover ctxt Normal (K ()) prover 
48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

273 
in prover params (K (K (K ""))) problem end 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

274 

6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

275 

48302  276 
(*** Lowlevel communication with MaSh ***) 
277 

48323  278 
fun write_file (xs, f) file = 
48318  279 
let val path = Path.explode file in 
48323  280 
File.write path ""; 
281 
xs > chunk_list 500 

282 
> List.app (File.append path o space_implode "" o map f) 

48318  283 
end 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

284 

252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

285 
fun mash_info overlord = 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

286 
if overlord then (getenv "ISABELLE_HOME_USER", "") 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

287 
else (getenv "ISABELLE_TMP", serial_string ()) 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

288 

252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

289 
fun run_mash ctxt (temp_dir, serial) core = 
48311  290 
let 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

291 
val log_file = temp_dir ^ "/mash_log" ^ serial 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

292 
val err_file = temp_dir ^ "/mash_err" ^ serial 
48311  293 
val command = 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

294 
mash_home () ^ "/mash.py quiet outputDir " ^ mash_state_dir () ^ 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

295 
" log " ^ log_file ^ " " ^ core ^ " 2>&1 > " ^ err_file 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

296 
in 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

297 
trace_msg ctxt (fn () => "Running " ^ command); 
48323  298 
write_file ([], K "") log_file; 
299 
write_file ([], K "") err_file; 

48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

300 
Isabelle_System.bash command; () 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

301 
end 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

302 

252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

303 
fun run_mash_init ctxt overlord write_access write_feats write_deps = 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

304 
let 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

305 
val info as (temp_dir, serial) = mash_info overlord 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

306 
val in_dir = temp_dir ^ "/mash_init" ^ serial 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

307 
> tap (Isabelle_System.mkdir o Path.explode) 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

308 
in 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

309 
write_file write_access (in_dir ^ "/mash_accessibility"); 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

310 
write_file write_feats (in_dir ^ "/mash_features"); 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

311 
write_file write_deps (in_dir ^ "/mash_dependencies"); 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

312 
run_mash ctxt info ("init inputDir " ^ in_dir) 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

313 
end 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

314 

48318  315 
fun run_mash_commands ctxt overlord save max_suggs write_cmds read_suggs = 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

316 
let 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

317 
val info as (temp_dir, serial) = mash_info overlord 
48318  318 
val sugg_file = temp_dir ^ "/mash_suggs" ^ serial 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

319 
val cmd_file = temp_dir ^ "/mash_commands" ^ serial 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

320 
in 
48323  321 
write_file ([], K "") sugg_file; 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

322 
write_file write_cmds cmd_file; 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

323 
run_mash ctxt info 
48318  324 
("inputFile " ^ cmd_file ^ " predictions " ^ sugg_file ^ 
325 
" numberOfPredictions " ^ string_of_int max_suggs ^ 

48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

326 
(if save then " saveModel" else "")); 
48318  327 
read_suggs (fn () => File.read_lines (Path.explode sugg_file)) 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

328 
end 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

329 

252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

330 
fun str_of_update (name, parents, feats, deps) = 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

331 
"! " ^ escape_meta name ^ ": " ^ escape_metas parents ^ "; " ^ 
48311  332 
escape_metas feats ^ "; " ^ escape_metas deps ^ "\n" 
333 

48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

334 
fun str_of_query (parents, feats) = 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

335 
"? " ^ escape_metas parents ^ "; " ^ escape_metas feats 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

336 

252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

337 
fun init_str_of_update get (upd as (name, _, _, _)) = 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

338 
escape_meta name ^ ": " ^ escape_metas (get upd) ^ "\n" 
48311  339 

48308  340 
fun mash_RESET ctxt = 
48314
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

341 
let val path = mash_state_dir () > Path.explode in 
48309  342 
trace_msg ctxt (K "MaSh RESET"); 
343 
File.fold_dir (fn file => fn () => 

344 
File.rm (Path.append path (Path.basic file))) 

345 
path () 

346 
end 

48302  347 

48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

348 
fun mash_INIT ctxt _ [] = mash_RESET ctxt 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

349 
 mash_INIT ctxt overlord upds = 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

350 
(trace_msg ctxt (fn () => "MaSh INIT " ^ 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

351 
elide_string 1000 (space_implode " " (map #1 upds))); 
48323  352 
run_mash_init ctxt overlord (upds, init_str_of_update #2) 
353 
(upds, init_str_of_update #3) (upds, init_str_of_update #4)) 

48302  354 

48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

355 
fun mash_ADD _ _ [] = () 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

356 
 mash_ADD ctxt overlord upds = 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

357 
(trace_msg ctxt (fn () => "MaSh ADD " ^ 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

358 
elide_string 1000 (space_implode " " (map #1 upds))); 
48323  359 
run_mash_commands ctxt overlord true 0 (upds, str_of_update) (K ())) 
48302  360 

48318  361 
fun mash_QUERY ctxt overlord max_suggs (query as (_, feats)) = 
48314
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

362 
(trace_msg ctxt (fn () => "MaSh QUERY " ^ space_implode " " feats); 
48318  363 
run_mash_commands ctxt overlord false max_suggs 
48323  364 
([query], str_of_query) 
48318  365 
(fn suggs => snd (extract_query (List.last (suggs ())))) 
48311  366 
handle List.Empty => []) 
48302  367 

368 

48251
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

369 
(*** Highlevel communication with MaSh ***) 
6cdcfbddc077
moved most of MaSh exporter code to Sledgehammer
blanchet
parents:
48249
diff
changeset

370 

48321  371 
fun try_graph ctxt when def f = 
372 
f () 

373 
handle Graph.CYCLES (cycle :: _) => 

374 
(trace_msg ctxt (fn () => 

375 
"Cycle involving " ^ commas cycle ^ " when " ^ when); def) 

376 
 Graph.UNDEF name => 

377 
(trace_msg ctxt (fn () => 

378 
"Unknown fact " ^ quote name ^ " when " ^ when); def) 

379 

48301  380 
type mash_state = 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

381 
{thys : bool Symtab.table, 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

382 
fact_graph : unit Graph.T} 
48301  383 

48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

384 
val empty_state = {thys = Symtab.empty, fact_graph = Graph.empty} 
48301  385 

386 
local 

387 

48321  388 
fun mash_load _ (state as (true, _)) = state 
389 
 mash_load ctxt _ = 

48309  390 
let val path = mash_state_path () in 
48302  391 
(true, 
392 
case try File.read_lines path of 

48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

393 
SOME (comp_thys :: incomp_thys :: fact_lines) => 
48302  394 
let 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

395 
fun add_thy comp thy = Symtab.update (thy, comp) 
48322
8a8d71e34297
fixed MaSh state load code so it works even if the facts are read in disorder
blanchet
parents:
48321
diff
changeset

396 
fun add_edge_to name parent = 
8a8d71e34297
fixed MaSh state load code so it works even if the facts are read in disorder
blanchet
parents:
48321
diff
changeset

397 
Graph.default_node (parent, ()) 
8a8d71e34297
fixed MaSh state load code so it works even if the facts are read in disorder
blanchet
parents:
48321
diff
changeset

398 
#> Graph.add_edge (parent, name) 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

399 
fun add_fact_line line = 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

400 
case extract_query line of 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

401 
("", _) => I (* shouldn't happen *) 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

402 
 (name, parents) => 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

403 
Graph.default_node (name, ()) 
48322
8a8d71e34297
fixed MaSh state load code so it works even if the facts are read in disorder
blanchet
parents:
48321
diff
changeset

404 
#> fold (add_edge_to name) parents 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

405 
val thys = 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

406 
Symtab.empty > fold (add_thy true) (unescape_metas comp_thys) 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

407 
> fold (add_thy false) (unescape_metas incomp_thys) 
48321  408 
val fact_graph = 
48322
8a8d71e34297
fixed MaSh state load code so it works even if the facts are read in disorder
blanchet
parents:
48321
diff
changeset

409 
try_graph ctxt "loading state" Graph.empty (fn () => 
48321  410 
Graph.empty > fold add_fact_line fact_lines) 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

411 
in {thys = thys, fact_graph = fact_graph} end 
48304  412 
 _ => empty_state) 
48302  413 
end 
48249  414 

48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

415 
fun mash_save ({thys, fact_graph, ...} : mash_state) = 
48301  416 
let 
48309  417 
val path = mash_state_path () 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

418 
val thys = Symtab.dest thys 
48318  419 
val line_for_thys = escape_metas o AList.find (op =) thys 
420 
fun fact_line_for name parents = 

421 
escape_meta name ^ ": " ^ escape_metas parents 

48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

422 
val append_fact = File.append path o suffix "\n" oo fact_line_for 
48301  423 
in 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

424 
File.write path (line_for_thys true ^ "\n" ^ line_for_thys false ^ "\n"); 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

425 
Graph.fold (fn (name, ((), (parents, _))) => fn () => 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

426 
append_fact name (Graph.Keys.dest parents)) 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

427 
fact_graph () 
48301  428 
end 
429 

48302  430 
val global_state = 
48304  431 
Synchronized.var "Sledgehammer_Filter_MaSh.global_state" (false, empty_state) 
48301  432 

433 
in 

434 

48321  435 
fun mash_map ctxt f = 
436 
Synchronized.change global_state (mash_load ctxt ##> (f #> tap mash_save)) 

48302  437 

48321  438 
fun mash_get ctxt = 
439 
Synchronized.change_result global_state (mash_load ctxt #> `snd) 

48302  440 

48308  441 
fun mash_reset ctxt = 
48302  442 
Synchronized.change global_state (fn _ => 
48309  443 
(mash_RESET ctxt; File.write (mash_state_path ()) ""; 
48308  444 
(true, empty_state))) 
48301  445 

446 
end 

447 

48318  448 
fun mash_could_suggest_facts () = mash_home () <> "" 
48321  449 
fun mash_can_suggest_facts ctxt = 
450 
not (Graph.is_empty (#fact_graph (mash_get ctxt))) 

48249  451 

48321  452 
fun parents_wrt_facts ctxt facts fact_graph = 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

453 
let 
48318  454 
val graph_facts = Symtab.make (map (rpair ()) (Graph.keys fact_graph)) 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

455 
val facts = 
48321  456 
try_graph ctxt "when computing ancestor facts" [] (fn () => 
457 
[] > fold (cons o Thm.get_name_hint o snd) facts 

458 
> filter (Symtab.defined graph_facts) 

459 
> Graph.all_preds fact_graph) 

48318  460 
val facts = Symtab.empty > fold (fn name => Symtab.update (name, ())) facts 
48321  461 
in 
462 
try_graph ctxt "when computing parent facts" [] (fn () => 

463 
fact_graph > Graph.restrict (Symtab.defined facts) > Graph.maximals) 

464 
end 

48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

465 

48318  466 
(* Generate more suggestions than requested, because some might be thrown out 
467 
later for various reasons and "meshing" gives better results with some 

468 
slack. *) 

469 
fun max_suggs_of max_facts = max_facts + Int.min (200, max_facts) 

470 

48320
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

471 
fun is_fact_in_graph fact_graph (_, th) = 
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

472 
can (Graph.get_node fact_graph) (Thm.get_name_hint th) 
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

473 

48318  474 
fun mash_suggest_facts ctxt ({overlord, ...} : params) prover max_facts hyp_ts 
475 
concl_t facts = 

48301  476 
let 
48302  477 
val thy = Proof_Context.theory_of ctxt 
48321  478 
val fact_graph = #fact_graph (mash_get ctxt) 
479 
val parents = parents_wrt_facts ctxt facts fact_graph 

48318  480 
val feats = features_of ctxt prover thy General (concl_t :: hyp_ts) 
481 
val suggs = 

48320
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

482 
if Graph.is_empty fact_graph then [] 
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

483 
else mash_QUERY ctxt overlord (max_suggs_of max_facts) (parents, feats) 
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

484 
val selected = facts > suggested_facts suggs 
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

485 
val unknown = facts > filter_out (is_fact_in_graph fact_graph) 
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

486 
in (selected, unknown) end 
48249  487 

48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

488 
fun add_thys_for thy = 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

489 
let fun add comp thy = Symtab.update (Context.theory_name thy, comp) in 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

490 
add false thy #> fold (add true) (Theory.ancestors_of thy) 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

491 
end 
48249  492 

48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

493 
fun update_fact_graph ctxt (name, parents, feats, deps) (upds, graph) = 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

494 
let 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

495 
fun maybe_add_from from (accum as (parents, graph)) = 
48321  496 
try_graph ctxt "updating graph" accum (fn () => 
497 
(from :: parents, Graph.add_edge_acyclic (from, name) graph)) 

498 
val graph = graph > Graph.default_node (name, ()) 

48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

499 
val (parents, graph) = ([], graph) > fold maybe_add_from parents 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

500 
val (deps, graph) = ([], graph) > fold maybe_add_from deps 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

501 
in ((name, parents, feats, deps) :: upds, graph) end 
48306  502 

48318  503 
val pass1_learn_timeout_factor = 0.5 
504 

505 
(* The timeout is understood in a very slack fashion. *) 

48319
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

506 
fun mash_learn_thy ctxt ({provers, verbose, overlord, ...} : params) thy timeout 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

507 
facts = 
48304  508 
let 
48318  509 
val timer = Timer.startRealTimer () 
510 
val prover = hd provers 

511 
fun timed_out frac = 

512 
Time.> (Timer.checkRealTimer timer, time_mult frac timeout) 

48321  513 
val {fact_graph, ...} = mash_get ctxt 
48320
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

514 
val new_facts = 
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

515 
facts > filter_out (is_fact_in_graph fact_graph) 
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

516 
> sort (thm_ord o pairself snd) 
48308  517 
in 
518 
if null new_facts then 

48319
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

519 
"" 
48308  520 
else 
48304  521 
let 
48308  522 
val ths = facts > map snd 
48315
82d6e46c673f
fixed order of accessibles + other tweaks to MaSh
blanchet
parents:
48314
diff
changeset

523 
val all_names = 
48324  524 
ths > filter_out is_likely_tautology_or_too_meta 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

525 
> map (rpair () o Thm.get_name_hint) 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

526 
> Symtab.make 
48318  527 
fun do_fact _ (accum as (_, true)) = accum 
528 
 do_fact ((_, (_, status)), th) ((parents, upds), false) = 

529 
let 

530 
val name = Thm.get_name_hint th 

531 
val feats = features_of ctxt prover thy status [prop_of th] 

532 
val deps = isabelle_dependencies_of all_names th 

533 
val upd = (name, parents, feats, deps) 

534 
in (([name], upd :: upds), timed_out pass1_learn_timeout_factor) end 

48321  535 
val parents = parents_wrt_facts ctxt facts fact_graph 
48318  536 
val ((_, upds), _) = 
537 
((parents, []), false) > fold do_fact new_facts >> apsnd rev 

538 
val n = length upds 

48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

539 
fun trans {thys, fact_graph} = 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

540 
let 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

541 
val mash_INIT_or_ADD = 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

542 
if Graph.is_empty fact_graph then mash_INIT else mash_ADD 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

543 
val (upds, fact_graph) = 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

544 
([], fact_graph) > fold (update_fact_graph ctxt) upds 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

545 
in 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

546 
(mash_INIT_or_ADD ctxt overlord (rev upds); 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

547 
{thys = thys > add_thys_for thy, 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

548 
fact_graph = fact_graph}) 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

549 
end 
48318  550 
in 
48321  551 
mash_map ctxt trans; 
48319
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

552 
if verbose then 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

553 
"Processed " ^ string_of_int n ^ " proof" ^ plural_s n ^ 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

554 
(if verbose then 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

555 
" in " ^ string_from_time (Timer.checkRealTimer timer) 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

556 
else 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

557 
"") ^ "." 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

558 
else 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

559 
"" 
48318  560 
end 
48308  561 
end 
48304  562 

48321  563 
fun mash_learn_proof ctxt ({provers, overlord, ...} : params) t facts used_ths = 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

564 
let 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

565 
val thy = Proof_Context.theory_of ctxt 
48318  566 
val prover = hd provers 
567 
val name = ATP_Util.timestamp () ^ serial_string () (* fresh enough *) 

568 
val feats = features_of ctxt prover thy General [t] 

48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

569 
val deps = used_ths > map Thm.get_name_hint 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

570 
in 
48321  571 
mash_map ctxt (fn {thys, fact_graph} => 
48309  572 
let 
48321  573 
val parents = parents_wrt_facts ctxt facts fact_graph 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

574 
val upds = [(name, parents, feats, deps)] 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

575 
val (upds, fact_graph) = 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

576 
([], fact_graph) > fold (update_fact_graph ctxt) upds 
48309  577 
in 
48316
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

578 
mash_ADD ctxt overlord upds; 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

579 
{thys = thys, fact_graph = fact_graph} 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

580 
end) 
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset

581 
end 
48249  582 

48318  583 
(* The threshold should be large enough so that MaSh doesn't kick in for Auto 
584 
Sledgehammer and Try. *) 

585 
val min_secs_for_learning = 15 

586 
val short_learn_timeout_factor = 0.2 

587 
val long_learn_timeout_factor = 4.0 

588 

48321  589 
fun relevant_facts ctxt (params as {learn, fact_filter, timeout, ...}) prover 
590 
max_facts ({add, only, ...} : fact_override) hyp_ts concl_t facts = 

48314
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

591 
if not (subset (op =) (the_list fact_filter, fact_filters)) then 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

592 
error ("Unknown fact filter: " ^ quote (the fact_filter) ^ ".") 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

593 
else if only then 
48289  594 
facts 
48321  595 
else if max_facts <= 0 orelse null facts then 
48288
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48251
diff
changeset

596 
[] 
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48251
diff
changeset

597 
else 
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48251
diff
changeset

598 
let 
48318  599 
val thy = Proof_Context.theory_of ctxt 
600 
fun maybe_learn can_suggest = 

48321  601 
if not learn orelse Async_Manager.has_running_threads MaShN then 
48319
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

602 
() 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

603 
else if Time.toSeconds timeout >= min_secs_for_learning then 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

604 
let 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

605 
val factor = 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

606 
if can_suggest then short_learn_timeout_factor 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

607 
else long_learn_timeout_factor 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

608 
val soft_timeout = time_mult factor timeout 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

609 
val hard_timeout = time_mult 2.0 soft_timeout 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

610 
val birth_time = Time.now () 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

611 
val death_time = Time.+ (birth_time, hard_timeout) 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

612 
val desc = ("machine learner for Sledgehammer", "") 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

613 
in 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

614 
Async_Manager.launch MaShN birth_time death_time desc 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

615 
(fn () => 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

616 
(true, mash_learn_thy ctxt params thy soft_timeout facts)) 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

617 
end 
48318  618 
else 
619 
() 

48314
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

620 
val fact_filter = 
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

621 
case fact_filter of 
48318  622 
SOME ff => 
48321  623 
(if ff <> iterN then maybe_learn (mash_can_suggest_facts ctxt) 
624 
else (); ff) 

48318  625 
 NONE => 
48321  626 
if mash_can_suggest_facts ctxt then (maybe_learn true; meshN) 
48318  627 
else if mash_could_suggest_facts () then (maybe_learn false; iterN) 
628 
else iterN 

48288
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48251
diff
changeset

629 
val add_ths = Attrib.eval_thms ctxt add 
48292  630 
fun prepend_facts ths accepts = 
48288
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48251
diff
changeset

631 
((facts > filter (member Thm.eq_thm_prop ths o snd)) @ 
48292  632 
(accepts > filter_out (member Thm.eq_thm_prop ths o snd))) 
48293  633 
> take max_facts 
48314
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

634 
fun iter () = 
48298  635 
iterative_relevant_facts ctxt params prover max_facts NONE hyp_ts 
636 
concl_t facts 

48314
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

637 
fun mash () = 
48320
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

638 
mash_suggest_facts ctxt params prover max_facts hyp_ts concl_t facts 
48314
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

639 
val mess = 
48320
891a24a48155
improved meshing of MaSh and MengPaulson if some MaSh suggestions are cutoff (the common case)
blanchet
parents:
48319
diff
changeset

640 
[] > (if fact_filter <> mashN then cons (iter (), []) else I) 
48314
ee33ba3c0e05
added option to control which fact filter is used
blanchet
parents:
48313
diff
changeset

641 
> (if fact_filter <> iterN then cons (mash ()) else I) 
48288
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48251
diff
changeset

642 
in 
48313
0faafdffa662
mesh facts by taking into consideration whether a fact is known to MeSh
blanchet
parents:
48312
diff
changeset

643 
mesh_facts max_facts mess 
48288
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48251
diff
changeset

644 
> not (null add_ths) ? prepend_facts add_ths 
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48251
diff
changeset

645 
end 
255c6e1fd505
rationalize relevance filter, slowing moving code from Iter to MaSh
blanchet
parents:
48251
diff
changeset

646 

48319
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

647 
fun kill_learners () = Async_Manager.kill_threads MaShN "learner" 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

648 
fun running_learners () = Async_Manager.running_threads MaShN "learner" 
340187063d84
use async manager to manage MaSh learners to make sure they get killed cleanly
blanchet
parents:
48318
diff
changeset

649 

48248  650 
end; 