author | boehmes |
Fri, 08 Apr 2011 19:04:08 +0200 | |
changeset 42323 | ab5747d44120 |
parent 37523 | 40c352510065 |
child 45404 | 69ec395ef6ca |
permissions | -rw-r--r-- |
12319 | 1 |
(* Title: Pure/net.ML |
2 |
Author: Lawrence C Paulson, Cambridge University Computer Laboratory |
|
0 | 3 |
Copyright 1993 University of Cambridge |
4 |
||
5 |
Discrimination nets: a data structure for indexing items |
|
6 |
||
12319 | 7 |
From the book |
8 |
E. Charniak, C. K. Riesbeck, D. V. McDermott. |
|
0 | 9 |
Artificial Intelligence Programming. |
10 |
(Lawrence Erlbaum Associates, 1980). [Chapter 14] |
|
225
76f60e6400e8
optimized net for matching of abstractions to speed up simplifier
nipkow
parents:
0
diff
changeset
|
11 |
|
12319 | 12 |
match_term no longer treats abstractions as wildcards; instead they match |
228 | 13 |
only wildcards in patterns. Requires operands to be beta-eta-normal. |
0 | 14 |
*) |
15 |
||
12319 | 16 |
signature NET = |
16808 | 17 |
sig |
0 | 18 |
type key |
16808 | 19 |
val key_of_term: term -> key list |
37523 | 20 |
val encode_type: typ -> term |
0 | 21 |
type 'a net |
22 |
val empty: 'a net |
|
16808 | 23 |
exception INSERT |
24 |
val insert: ('a * 'a -> bool) -> key list * 'a -> 'a net -> 'a net |
|
25 |
val insert_term: ('a * 'a -> bool) -> term * 'a -> 'a net -> 'a net |
|
33371 | 26 |
val insert_safe: ('a * 'a -> bool) -> key list * 'a -> 'a net -> 'a net |
27 |
val insert_term_safe: ('a * 'a -> bool) -> term * 'a -> 'a net -> 'a net |
|
16808 | 28 |
exception DELETE |
29 |
val delete: ('b * 'a -> bool) -> key list * 'b -> 'a net -> 'a net |
|
30 |
val delete_term: ('b * 'a -> bool) -> term * 'b -> 'a net -> 'a net |
|
33371 | 31 |
val delete_safe: ('b * 'a -> bool) -> key list * 'b -> 'a net -> 'a net |
32 |
val delete_term_safe: ('b * 'a -> bool) -> term * 'b -> 'a net -> 'a net |
|
16808 | 33 |
val lookup: 'a net -> key list -> 'a list |
0 | 34 |
val match_term: 'a net -> term -> 'a list |
35 |
val unify_term: 'a net -> term -> 'a list |
|
16808 | 36 |
val entries: 'a net -> 'a list |
37 |
val subtract: ('b * 'a -> bool) -> 'a net -> 'b net -> 'b list |
|
38 |
val merge: ('a * 'a -> bool) -> 'a net * 'a net -> 'a net |
|
20011 | 39 |
val content: 'a net -> 'a list |
16808 | 40 |
end; |
0 | 41 |
|
16808 | 42 |
structure Net: NET = |
0 | 43 |
struct |
44 |
||
45 |
datatype key = CombK | VarK | AtomK of string; |
|
46 |
||
228 | 47 |
(*Keys are preorder lists of symbols -- Combinations, Vars, Atoms. |
225
76f60e6400e8
optimized net for matching of abstractions to speed up simplifier
nipkow
parents:
0
diff
changeset
|
48 |
Any term whose head is a Var is regarded entirely as a Var. |
228 | 49 |
Abstractions are also regarded as Vars; this covers eta-conversion |
50 |
and "near" eta-conversions such as %x.?P(?f(x)). |
|
0 | 51 |
*) |
12319 | 52 |
fun add_key_of_terms (t, cs) = |
0 | 53 |
let fun rands (f$t, cs) = CombK :: rands (f, add_key_of_terms(t, cs)) |
12319 | 54 |
| rands (Const(c,_), cs) = AtomK c :: cs |
55 |
| rands (Free(c,_), cs) = AtomK c :: cs |
|
20080 | 56 |
| rands (Bound i, cs) = AtomK (Name.bound i) :: cs |
0 | 57 |
in case (head_of t) of |
225
76f60e6400e8
optimized net for matching of abstractions to speed up simplifier
nipkow
parents:
0
diff
changeset
|
58 |
Var _ => VarK :: cs |
228 | 59 |
| Abs _ => VarK :: cs |
225
76f60e6400e8
optimized net for matching of abstractions to speed up simplifier
nipkow
parents:
0
diff
changeset
|
60 |
| _ => rands(t,cs) |
0 | 61 |
end; |
62 |
||
225
76f60e6400e8
optimized net for matching of abstractions to speed up simplifier
nipkow
parents:
0
diff
changeset
|
63 |
(*convert a term to a list of keys*) |
0 | 64 |
fun key_of_term t = add_key_of_terms (t, []); |
65 |
||
37523 | 66 |
(*encode_type -- for indexing purposes*) |
67 |
fun encode_type (Type (c, Ts)) = Term.list_comb (Const (c, dummyT), map encode_type Ts) |
|
68 |
| encode_type (TFree (a, _)) = Free (a, dummyT) |
|
69 |
| encode_type (TVar (a, _)) = Var (a, dummyT); |
|
70 |
||
0 | 71 |
|
72 |
(*Trees indexed by key lists: each arc is labelled by a key. |
|
73 |
Each node contains a list of items, and arcs to children. |
|
74 |
The empty key addresses the entire net. |
|
75 |
Lookup functions preserve order in items stored at same level. |
|
76 |
*) |
|
77 |
datatype 'a net = Leaf of 'a list |
|
12319 | 78 |
| Net of {comb: 'a net, |
79 |
var: 'a net, |
|
16708 | 80 |
atoms: 'a net Symtab.table}; |
0 | 81 |
|
82 |
val empty = Leaf[]; |
|
16708 | 83 |
fun is_empty (Leaf []) = true | is_empty _ = false; |
84 |
val emptynet = Net{comb=empty, var=empty, atoms=Symtab.empty}; |
|
0 | 85 |
|
86 |
||
87 |
(*** Insertion into a discrimination net ***) |
|
88 |
||
12319 | 89 |
exception INSERT; (*duplicate item in the net*) |
0 | 90 |
|
91 |
||
92 |
(*Adds item x to the list at the node addressed by the keys. |
|
93 |
Creates node if not already present. |
|
12319 | 94 |
eq is the equality test for items. |
0 | 95 |
The empty list of keys generates a Leaf node, others a Net node. |
96 |
*) |
|
16808 | 97 |
fun insert eq (keys,x) net = |
12319 | 98 |
let fun ins1 ([], Leaf xs) = |
16686 | 99 |
if member eq xs x then raise INSERT else Leaf(x::xs) |
0 | 100 |
| ins1 (keys, Leaf[]) = ins1 (keys, emptynet) (*expand empty...*) |
16708 | 101 |
| ins1 (CombK :: keys, Net{comb,var,atoms}) = |
102 |
Net{comb=ins1(keys,comb), var=var, atoms=atoms} |
|
103 |
| ins1 (VarK :: keys, Net{comb,var,atoms}) = |
|
104 |
Net{comb=comb, var=ins1(keys,var), atoms=atoms} |
|
105 |
| ins1 (AtomK a :: keys, Net{comb,var,atoms}) = |
|
106 |
let |
|
18939 | 107 |
val net' = the_default empty (Symtab.lookup atoms a); |
17412 | 108 |
val atoms' = Symtab.update (a, ins1 (keys, net')) atoms; |
16708 | 109 |
in Net{comb=comb, var=var, atoms=atoms'} end |
0 | 110 |
in ins1 (keys,net) end; |
111 |
||
33371 | 112 |
fun insert_term eq (t, x) = insert eq (key_of_term t, x); |
113 |
||
16808 | 114 |
fun insert_safe eq entry net = insert eq entry net handle INSERT => net; |
33371 | 115 |
fun insert_term_safe eq entry net = insert_term eq entry net handle INSERT => net; |
16808 | 116 |
|
0 | 117 |
|
118 |
(*** Deletion from a discrimination net ***) |
|
119 |
||
12319 | 120 |
exception DELETE; (*missing item in the net*) |
0 | 121 |
|
122 |
(*Create a new Net node if it would be nonempty*) |
|
16708 | 123 |
fun newnet (args as {comb,var,atoms}) = |
124 |
if is_empty comb andalso is_empty var andalso Symtab.is_empty atoms |
|
125 |
then empty else Net args; |
|
0 | 126 |
|
127 |
(*Deletes item x from the list at the node addressed by the keys. |
|
128 |
Raises DELETE if absent. Collapses the net if possible. |
|
129 |
eq is the equality test for items. *) |
|
16808 | 130 |
fun delete eq (keys, x) net = |
0 | 131 |
let fun del1 ([], Leaf xs) = |
16686 | 132 |
if member eq xs x then Leaf (remove eq x xs) |
0 | 133 |
else raise DELETE |
12319 | 134 |
| del1 (keys, Leaf[]) = raise DELETE |
16708 | 135 |
| del1 (CombK :: keys, Net{comb,var,atoms}) = |
136 |
newnet{comb=del1(keys,comb), var=var, atoms=atoms} |
|
137 |
| del1 (VarK :: keys, Net{comb,var,atoms}) = |
|
138 |
newnet{comb=comb, var=del1(keys,var), atoms=atoms} |
|
139 |
| del1 (AtomK a :: keys, Net{comb,var,atoms}) = |
|
140 |
let val atoms' = |
|
17412 | 141 |
(case Symtab.lookup atoms a of |
16708 | 142 |
NONE => raise DELETE |
143 |
| SOME net' => |
|
144 |
(case del1 (keys, net') of |
|
145 |
Leaf [] => Symtab.delete a atoms |
|
17412 | 146 |
| net'' => Symtab.update (a, net'') atoms)) |
16708 | 147 |
in newnet{comb=comb, var=var, atoms=atoms'} end |
0 | 148 |
in del1 (keys,net) end; |
149 |
||
16808 | 150 |
fun delete_term eq (t, x) = delete eq (key_of_term t, x); |
0 | 151 |
|
33371 | 152 |
fun delete_safe eq entry net = delete eq entry net handle DELETE => net; |
153 |
fun delete_term_safe eq entry net = delete_term eq entry net handle DELETE => net; |
|
154 |
||
16677 | 155 |
|
0 | 156 |
(*** Retrieval functions for discrimination nets ***) |
157 |
||
16708 | 158 |
exception ABSENT; |
0 | 159 |
|
16708 | 160 |
fun the_atom atoms a = |
17412 | 161 |
(case Symtab.lookup atoms a of |
16708 | 162 |
NONE => raise ABSENT |
163 |
| SOME net => net); |
|
0 | 164 |
|
165 |
(*Return the list of items at the given node, [] if no such node*) |
|
16808 | 166 |
fun lookup (Leaf xs) [] = xs |
167 |
| lookup (Leaf _) (_ :: _) = [] (*non-empty keys and empty net*) |
|
168 |
| lookup (Net {comb, var, atoms}) (CombK :: keys) = lookup comb keys |
|
169 |
| lookup (Net {comb, var, atoms}) (VarK :: keys) = lookup var keys |
|
170 |
| lookup (Net {comb, var, atoms}) (AtomK a :: keys) = |
|
171 |
lookup (the_atom atoms a) keys handle ABSENT => []; |
|
0 | 172 |
|
173 |
||
174 |
(*Skipping a term in a net. Recursively skip 2 levels if a combination*) |
|
23178 | 175 |
fun net_skip (Leaf _) nets = nets |
176 |
| net_skip (Net{comb,var,atoms}) nets = |
|
177 |
fold_rev net_skip (net_skip comb []) (Symtab.fold (cons o #2) atoms (var::nets)); |
|
0 | 178 |
|
16808 | 179 |
|
180 |
(** Matching and Unification **) |
|
0 | 181 |
|
182 |
(*conses the linked net, if present, to nets*) |
|
16708 | 183 |
fun look1 (atoms, a) nets = |
184 |
the_atom atoms a :: nets handle ABSENT => nets; |
|
0 | 185 |
|
12319 | 186 |
(*Return the nodes accessible from the term (cons them before nets) |
0 | 187 |
"unif" signifies retrieval for unification rather than matching. |
188 |
Var in net matches any term. |
|
12319 | 189 |
Abs or Var in object: if "unif", regarded as wildcard, |
225
76f60e6400e8
optimized net for matching of abstractions to speed up simplifier
nipkow
parents:
0
diff
changeset
|
190 |
else matches only a variable in net. |
76f60e6400e8
optimized net for matching of abstractions to speed up simplifier
nipkow
parents:
0
diff
changeset
|
191 |
*) |
23178 | 192 |
fun matching unif t net nets = |
0 | 193 |
let fun rands _ (Leaf _, nets) = nets |
16708 | 194 |
| rands t (Net{comb,atoms,...}, nets) = |
12319 | 195 |
case t of |
23178 | 196 |
f$t => fold_rev (matching unif t) (rands f (comb,[])) nets |
16708 | 197 |
| Const(c,_) => look1 (atoms, c) nets |
198 |
| Free(c,_) => look1 (atoms, c) nets |
|
20080 | 199 |
| Bound i => look1 (atoms, Name.bound i) nets |
12319 | 200 |
| _ => nets |
201 |
in |
|
0 | 202 |
case net of |
12319 | 203 |
Leaf _ => nets |
0 | 204 |
| Net{var,...} => |
12319 | 205 |
case head_of t of |
23178 | 206 |
Var _ => if unif then net_skip net nets |
12319 | 207 |
else var::nets (*only matches Var in net*) |
2836 | 208 |
(*If "unif" then a var instantiation in the abstraction could allow |
209 |
an eta-reduction, so regard the abstraction as a wildcard.*) |
|
23178 | 210 |
| Abs _ => if unif then net_skip net nets |
12319 | 211 |
else var::nets (*only a Var can match*) |
212 |
| _ => rands t (net, var::nets) (*var could match also*) |
|
0 | 213 |
end; |
214 |
||
19482
9f11af8f7ef9
tuned basic list operators (flat, maps, map_filter);
wenzelm
parents:
18939
diff
changeset
|
215 |
fun extract_leaves l = maps (fn Leaf xs => xs) l; |
0 | 216 |
|
225
76f60e6400e8
optimized net for matching of abstractions to speed up simplifier
nipkow
parents:
0
diff
changeset
|
217 |
(*return items whose key could match t, WHICH MUST BE BETA-ETA NORMAL*) |
12319 | 218 |
fun match_term net t = |
23178 | 219 |
extract_leaves (matching false t net []); |
0 | 220 |
|
221 |
(*return items whose key could unify with t*) |
|
12319 | 222 |
fun unify_term net t = |
23178 | 223 |
extract_leaves (matching true t net []); |
0 | 224 |
|
3548 | 225 |
|
16808 | 226 |
(** operations on nets **) |
227 |
||
228 |
(*subtraction: collect entries of second net that are NOT present in first net*) |
|
229 |
fun subtract eq net1 net2 = |
|
230 |
let |
|
231 |
fun subtr (Net _) (Leaf ys) = append ys |
|
232 |
| subtr (Leaf xs) (Leaf ys) = |
|
233 |
fold_rev (fn y => if member eq xs y then I else cons y) ys |
|
234 |
| subtr (Leaf _) (net as Net _) = subtr emptynet net |
|
235 |
| subtr (Net {comb = comb1, var = var1, atoms = atoms1}) |
|
236 |
(Net {comb = comb2, var = var2, atoms = atoms2}) = |
|
16842 | 237 |
subtr comb1 comb2 |
238 |
#> subtr var1 var2 |
|
239 |
#> Symtab.fold (fn (a, net) => |
|
18939 | 240 |
subtr (the_default emptynet (Symtab.lookup atoms1 a)) net) atoms2 |
16808 | 241 |
in subtr net1 net2 [] end; |
242 |
||
243 |
fun entries net = subtract (K false) empty net; |
|
244 |
||
245 |
||
246 |
(* merge *) |
|
3548 | 247 |
|
248 |
fun cons_fst x (xs, y) = (x :: xs, y); |
|
249 |
||
250 |
fun dest (Leaf xs) = map (pair []) xs |
|
16708 | 251 |
| dest (Net {comb, var, atoms}) = |
3560 | 252 |
map (cons_fst CombK) (dest comb) @ |
253 |
map (cons_fst VarK) (dest var) @ |
|
19482
9f11af8f7ef9
tuned basic list operators (flat, maps, map_filter);
wenzelm
parents:
18939
diff
changeset
|
254 |
maps (fn (a, net) => map (cons_fst (AtomK a)) (dest net)) (Symtab.dest atoms); |
3548 | 255 |
|
16808 | 256 |
fun merge eq (net1, net2) = fold (insert_safe eq) (dest net2) net1; |
3548 | 257 |
|
20011 | 258 |
fun content net = map #2 (dest net); |
259 |
||
0 | 260 |
end; |