author | blanchet |
Sun, 06 Jan 2013 17:38:29 +0100 | |
changeset 50754 | 74a6adcb96ac |
parent 50735 | 6b232d76cbc9 |
child 50814 | 4247cbd78aaf |
permissions | -rw-r--r-- |
48234 | 1 |
(* Title: HOL/TPTP/mash_export.ML |
2 |
Author: Jasmin Blanchette, TU Muenchen |
|
3 |
Copyright 2012 |
|
4 |
||
5 |
Export Isabelle theory information for MaSh (Machine-learning for Sledgehammer). |
|
6 |
*) |
|
7 |
||
8 |
(* Interface of the MaSh exporter.  Each generator takes the name of the
   output file as its last (string) argument. *)
signature MASH_EXPORT =
sig
  type params = Sledgehammer_Provers.params

  (* Arguments: context, theories, include_thys flag, file name. *)
  val generate_accessibility :
    Proof.context -> theory list -> bool -> string -> unit

  (* Arguments: context, prover name, theories, include_thys flag,
     file name. *)
  val generate_features :
    Proof.context -> string -> theory list -> bool -> string -> unit

  (* Arguments: context, theories, include_thys flag, file name. *)
  val generate_isar_dependencies :
    Proof.context -> theory list -> bool -> string -> unit

  (* Arguments: context, prover parameters, fact index range (lower bound,
     optional upper bound), theories, include_thys flag, file name. *)
  val generate_prover_dependencies :
    Proof.context -> params -> int * int option -> theory list -> bool
    -> string -> unit

  (* Arguments: context, prover name, theories, file name. *)
  val generate_isar_commands :
    Proof.context -> string -> theory list -> string -> unit

  (* Arguments: context, prover parameters, fact index range, theories,
     file name. *)
  val generate_prover_commands :
    Proof.context -> params -> int * int option -> theory list -> string
    -> unit

  (* Arguments: context, prover parameters, theories, maximum number of
     facts, file name. *)
  val generate_mepo_suggestions :
    Proof.context -> params -> theory list -> int -> string -> unit
end;
28 |
||
29 |
structure MaSh_Export : MASH_EXPORT = |
|
30 |
struct |
|
31 |
||
50485
3c6ac2da2f45
merge aliased theorems in MaSh dependencies, modulo symmetry of equality
blanchet
parents:
50484
diff
changeset
|
32 |
open Sledgehammer_Fact |
48381 | 33 |
open Sledgehammer_MePo |
34 |
open Sledgehammer_MaSh |
|
48245 | 35 |
|
50559
89c0d2f13cca
MaSh exporter can now export subsets of the facts, as consecutive ranges
blanchet
parents:
50523
diff
changeset
|
36 |
(* Tests whether index j lies in the range that starts at "from" (inclusive).
   The upper bound "to" is inclusive as well; NONE means no upper bound. *)
fun in_range (from, to) j =
  if j < from then false
  else
    (case to of
      NONE => true
    | SOME upper => j <= upper)
89c0d2f13cca
MaSh exporter can now export subsets of the facts, as consecutive ranges
blanchet
parents:
50523
diff
changeset
|
38 |
|
50349 | 39 |
(* Holds when the name of thy equals the name of the theory that
   theory_of_thm returns for th. *)
fun has_thm_thy th thy =
  let
    val thy_name = Context.theory_name thy
    val thm_thy_name = Context.theory_name (theory_of_thm th)
  in thy_name = thm_thy_name end
252f45c04042
drastic overhaul of MaSh data structures + fixed a few performance issues
blanchet
parents:
48315
diff
changeset
|
41 |
|
50349 | 42 |
(* Holds when th satisfies has_thm_thy for at least one theory in thys. *)
fun has_thys thys th = List.exists (fn thy => has_thm_thy th thy) thys
43 |
||
44 |
(* Collects the facts reported by Sledgehammer_Fact.all_facts for ctxt and
   returns them sorted by thm_ord applied to their theorem components. *)
fun all_facts ctxt =
  let
    val css = Sledgehammer_Fact.clasimpset_rule_table_of ctxt
    val unsorted =
      Sledgehammer_Fact.all_facts ctxt true false Symtab.empty [] [] css
    (* Compare two facts by their theorems (second components) only. *)
    fun by_thm (fact1, fact2) = thm_ord (snd fact1, snd fact2)
  in sort by_thm unsorted end
49 |
||
50349 | 50 |
(* Writes one line per fact to file_name, of the form
   "<fact>: <previously written fact>"; the first fact gets an empty
   predecessor list.  Unless include_thys is set, facts belonging to one of
   thys are left out.  The file is truncated first and then appended to
   line by line. *)
fun generate_accessibility ctxt thys include_thys file_name =
  let
    val path = Path.explode file_name
    val _ = File.write path ""
    val candidates = all_facts ctxt
    val kept =
      if include_thys then candidates
      else filter_out (fn (_, th) => has_thys thys th) candidates
    val names = map (fn (_, th) => nickname_of_thm th) kept
    (* Append the line for "name" and make it the sole predecessor of the
       next fact. *)
    fun emit name prevs =
      (File.append path (escape_meta name ^ ": " ^ escape_metas prevs ^ "\n");
       [name])
    val _ = fold emit names []
  in () end
48304 | 64 |
|
50349 | 65 |
(* Writes one line "<fact>: <encoded features>" per fact to file_name.  The
   features come from features_of and are sorted by their first component
   before encoding.  Unless include_thys is set, facts belonging to one of
   thys are left out. *)
fun generate_features ctxt prover thys include_thys file_name =
  let
    val path = Path.explode file_name
    val _ = File.write path ""
    val candidates = all_facts ctxt
    val selected =
      if include_thys then candidates
      else filter_out (fn (_, th) => has_thys thys th) candidates
    (* Build the output line for a single fact. *)
    fun feature_line ((_, stature), th) =
      let
        val name = nickname_of_thm th
        val feats =
          features_of ctxt prover (theory_of_thm th) stature [prop_of th]
      in
        escape_meta name ^ ": " ^ encode_features (sort_wrt fst feats) ^ "\n"
      end
  in List.app (fn fact => File.append path (feature_line fact)) selected end
|
81 |
||
50735
6b232d76cbc9
refined class handling, to prevent cycles in fact graph
blanchet
parents:
50624
diff
changeset
|
82 |
(* Chooses the source of dependencies for th:
   - with prover parameters, the second component of the result of
     prover_dependencies_of for the first listed prover;
   - otherwise the supplied Isar dependencies if present;
   - otherwise freshly computed Isar dependencies. *)
fun isar_or_prover_dependencies_of ctxt params_opt facts name_tabs th
    isar_deps_opt =
  (case (params_opt, isar_deps_opt) of
    (SOME (params as {provers = prover :: _, ...}), _) =>
      snd (prover_dependencies_of ctxt params prover 0 facts name_tabs th)
  | (NONE, SOME deps) => deps
  | (NONE, NONE) => isar_dependencies_of name_tabs th)
50411 | 91 |
|
50559
89c0d2f13cca
MaSh exporter can now export subsets of the facts, as consecutive ranges
blanchet
parents:
50523
diff
changeset
|
92 |
(* Writes one line "<fact>: <dependencies>" to file_name for every fact whose
   1-based index lies within range; facts outside the range contribute an
   empty string.  Unless include_thys is set, facts belonging to one of thys
   are left out before indexing.  Lines are computed with Par_List.map. *)
fun generate_isar_or_prover_dependencies ctxt params_opt range thys include_thys
    file_name =
  let
    val path = Path.explode file_name
    val candidates = all_facts ctxt
    val facts =
      if include_thys then candidates
      else filter_out (fn (_, th) => has_thys thys th) candidates
    val name_tabs = build_name_tables nickname_of_thm facts
    (* Output line for the fact with index j and theorem th. *)
    fun dependency_line j th =
      let
        val name = nickname_of_thm th
        val _ = tracing ("Fact " ^ string_of_int j ^ ": " ^ name)
        val deps =
          isar_or_prover_dependencies_of ctxt params_opt facts name_tabs th
            NONE
      in escape_meta name ^ ": " ^ escape_metas deps ^ "\n" end
    fun do_fact (j, (_, th)) =
      if not (in_range range j) then "" else dependency_line j th
    val lines = Par_List.map do_fact (tag_list 1 facts)
  in File.write_list path lines end
48304 | 112 |
|
50411 | 113 |
(* Isar variant of the dependency export: no prover parameters, and a range
   starting at index 1 with no upper bound. *)
fun generate_isar_dependencies ctxt =
  let val whole_range = (1, NONE)
  in generate_isar_or_prover_dependencies ctxt NONE whole_range end
50411 | 115 |
|
50484
8ec31bdb9d36
adopt the neutral "prover" terminology for MaSh rather than the ambiguous/wrong ATP terminology (which sometimes excludes SMT solvers)
blanchet
parents:
50442
diff
changeset
|
116 |
(* Prover variant of the dependency export: forwards params wrapped in SOME;
   the remaining arguments (range, theories, include_thys flag, file name)
   are passed through unchanged. *)
fun generate_prover_dependencies ctxt params range thys include_thys
    file_name =
  generate_isar_or_prover_dependencies ctxt (SOME params) range thys
    include_thys file_name
50411 | 118 |
|
50515
c4a27ab89c9b
shared bad MaSh query detection between MePo and MaSh, so that the generated files mirror each other
blanchet
parents:
50511
diff
changeset
|
119 |
(* A query for th is rejected when th has an empty legacy kind, when it has
   no Isar dependencies, or when is_blacklisted_or_something holds for its
   name hint.  The checks are tried in that order and stop at the first
   that holds. *)
fun is_bad_query ctxt ho_atp th isar_deps =
  if Thm.legacy_get_kind th = "" then true
  else if null isar_deps then true
  else is_blacklisted_or_something ctxt ho_atp (Thm.get_name_hint th)
50515
c4a27ab89c9b
shared bad MaSh query detection between MePo and MaSh, so that the generated files mirror each other
blanchet
parents:
50511
diff
changeset
|
122 |
|
50559
89c0d2f13cca
MaSh exporter can now export subsets of the facts, as consecutive ranges
blanchet
parents:
50523
diff
changeset
|
123 |
(* Writes MaSh commands to file_name for the facts that belong to thys (the
   "new" facts).  Each new fact whose 1-based index lies within range yields
   an update line "! ..." preceded, unless is_bad_query rejects it, by a
   query line "? ...".  Facts outside the range contribute an empty string.
   The predecessor of the first new fact is the last of the remaining
   ("old") facts, if any; every later new fact has the preceding new fact as
   predecessor. *)
fun generate_isar_or_prover_commands ctxt prover params_opt range thys
    file_name =
  let
    val ho_atp = Sledgehammer_Provers.is_ho_atp ctxt prover
    val path = Path.explode file_name
    val facts = all_facts ctxt
    val (new_facts, old_facts) =
      List.partition (fn (_, th) => has_thys thys th) facts
    val name_tabs = build_name_tables nickname_of_thm facts
    (* Query/update text for one in-range fact. *)
    fun commands_for j name stature th prevs =
      let
        val _ = tracing ("Fact " ^ string_of_int j ^ ": " ^ name)
        val feats =
          features_of ctxt prover (theory_of_thm th) stature [prop_of th]
        val isar_deps = isar_dependencies_of name_tabs th
        val deps =
          isar_or_prover_dependencies_of ctxt params_opt facts name_tabs th
            (SOME isar_deps)
        (* Part shared by the query and the update line. *)
        val core =
          escape_meta name ^ ": " ^ escape_metas prevs ^ "; " ^
          encode_features (sort_wrt fst feats)
        val skip_query = is_bad_query ctxt ho_atp th isar_deps
        val update =
          "! " ^ core ^ "; " ^
          escape_metas (these (trim_dependencies th deps)) ^ "\n"
      in
        if skip_query then update else "? " ^ core ^ "\n" ^ update
      end
    fun do_fact (j, ((name, ((_, stature), th)), prevs)) =
      if not (in_range range j) then ""
      else commands_for j name stature th prevs
    (* Nickname of the last old fact, or nothing if there are no old
       facts. *)
    val parents =
      (case try List.last old_facts of
        NONE => []
      | SOME (_, th) => [nickname_of_thm th])
    val named_new_facts =
      map (fn fact as (_, th) => (nickname_of_thm th, fact)) new_facts
    (* Predecessor list for each new fact: "parents" for the first one, then
       the singleton name of the preceding new fact. *)
    val prevss =
      fst (split_last
        (parents :: map (fn (name, _) => [name]) named_new_facts))
    val lines = Par_List.map do_fact (tag_list 1 (named_new_facts ~~ prevss))
  in File.write_list path lines end
48239
0016290f904c
generate Meng--Paulson facts for evaluation purposes
blanchet
parents:
48235
diff
changeset
|
159 |
|
50411 | 160 |
(* Isar variant of the command export: no prover parameters, and a range
   starting at index 1 with no upper bound. *)
fun generate_isar_commands ctxt prover =
  let val whole_range = (1, NONE)
  in generate_isar_or_prover_commands ctxt prover NONE whole_range end
50411 | 162 |
|
50484
8ec31bdb9d36
adopt the neutral "prover" terminology for MaSh rather than the ambiguous/wrong ATP terminology (which sometimes excludes SMT solvers)
blanchet
parents:
50442
diff
changeset
|
163 |
(* Prover variant of the command export: uses the first prover listed in
   params and forwards params wrapped in SOME.  The argument pattern only
   matches a non-empty prover list. *)
fun generate_prover_commands ctxt (params as {provers = prover :: _, ...}) =
  let val params_opt = SOME params
  in generate_isar_or_prover_commands ctxt prover params_opt end
50411 | 165 |
|
50515
c4a27ab89c9b
shared bad MaSh query detection between MePo and MaSh, so that the generated files mirror each other
blanchet
parents:
50511
diff
changeset
|
166 |
(* Writes one line "<fact>: <suggestions>" to file_name for every fact that
   belongs to thys (the "new" facts), where the suggestions are the nicknames
   of the facts returned by Sledgehammer_MePo.mepo_suggested_facts.  A new
   fact rejected by is_bad_query contributes an empty string.  The facts
   offered to MePo for a new fact are all old facts plus the new facts that
   come before it.  The argument pattern only matches a non-empty prover
   list. *)
fun generate_mepo_suggestions ctxt (params as {provers = prover :: _, ...}) thys
    max_facts file_name =
  let
    val ho_atp = Sledgehammer_Provers.is_ho_atp ctxt prover
    val path = Path.explode file_name
    val facts = all_facts ctxt
    val (new_facts, old_facts) =
      List.partition (fn (_, th) => has_thys thys th) facts
    val name_tabs = build_name_tables nickname_of_thm facts
    (* Output line for one new fact, given the facts visible to it. *)
    fun suggestion_line ((_, th), visible_facts) =
      let
        val name = nickname_of_thm th
        val goal = goal_of_thm (Proof_Context.theory_of ctxt) th
        val (_, hyp_ts, concl_t) = ATP_Util.strip_subgoal ctxt goal 1
        val isar_deps = isar_dependencies_of name_tabs th
        val bad = is_bad_query ctxt ho_atp th isar_deps
      in
        if not bad then
          let
            val suggested =
              Sledgehammer_MePo.mepo_suggested_facts ctxt params prover
                max_facts NONE hyp_ts concl_t visible_facts
            val suggs = map (fn (_, sugg_th) => nickname_of_thm sugg_th) suggested
          in escape_meta name ^ ": " ^ escape_metas suggs ^ "\n" end
        else
          ""
      end
    (* Push a new prefix that extends the most recent one by "fact". *)
    fun extend fact (prefixes as latest :: _) = (fact :: latest) :: prefixes
    (* The head of the folded list contains every new fact and is paired
       with none of them, so it is dropped; the rest is in reverse order. *)
    val visible_factss = rev (tl (fold extend new_facts [old_facts]))
    val lines = Par_List.map suggestion_line (new_facts ~~ visible_factss)
  in File.write_list path lines end
|
48234 | 196 |
|
197 |
end; |