| author | wenzelm | 
| Fri, 24 May 2024 16:15:27 +0200 | |
| changeset 80188 | 3956e8b6a9c9 | 
| parent 78817 | 30bcf149054d | 
| child 81588 | 81a72b7fcb0c | 
| permissions | -rw-r--r-- | 
| 11523 | 1 | (* Title: Pure/General/scan.ML | 
| 2 | Author: Markus Wenzel and Tobias Nipkow, TU Muenchen | |
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 3 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 4 | Generic scanners (for potentially infinite input). | 
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 5 | *) | 
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 6 | |
| 24025 | 7 | infix 5 -- :-- :|-- |-- --| ^^; | 
| 25999 | 8 | infixr 5 ::: @@@; | 
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 9 | infix 3 >>; | 
| 23699 | 10 | infixr 0 ||; | 
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 11 | |
signature BASIC_SCAN =
sig
  (*failure message as a thunk: unit -> string*)
  type message = unit -> string

  (*error msg handler*)
  val !! : ('a * message option -> message) -> ('a -> 'b) -> 'a -> 'b
  val !!! : string -> ('a -> string option) -> ('a -> 'b) -> 'a -> 'b

  (*apply function*)
  val >> : ('a -> 'b * 'c) * ('b -> 'd) -> 'a -> 'd * 'c

  (*alternative*)
  val || : ('a -> 'b) * ('a -> 'b) -> 'a -> 'b

  (*sequential pairing*)
  val -- : ('a -> 'b * 'c) * ('c -> 'd * 'e) -> 'a -> ('b * 'd) * 'e

  (*dependent pairing*)
  val :-- : ('a -> 'b * 'c) * ('b -> 'c -> 'd * 'e) -> 'a -> ('b * 'd) * 'e

  (*projections*)
  val :|-- : ('a -> 'b * 'c) * ('b -> 'c -> 'd * 'e) -> 'a -> 'd * 'e
  val |-- : ('a -> 'b * 'c) * ('c -> 'd * 'e) -> 'a -> 'd * 'e
  val --| : ('a -> 'b * 'c) * ('c -> 'd * 'e) -> 'a -> 'b * 'e

  (*concatenation*)
  val ^^ : ('a -> string * 'b) * ('b -> string * 'c) -> 'a -> string * 'c
  val ::: : ('a -> 'b * 'c) * ('c -> 'b list * 'd) -> 'a -> 'b list * 'd
  val @@@ : ('a -> 'b list * 'c) * ('c -> 'b list * 'd) -> 'a -> 'b list * 'd

  (*one element literal*)
  val $$ : string -> string list -> string * string list
  val ~$$ : string -> string list -> string * string list
end;
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 38 | |
signature SCAN =
sig
  include BASIC_SCAN

  (*exception handling*)
  val permissive: ('a -> 'b) -> 'a -> 'b
  val error: ('a -> 'b) -> 'a -> 'b
  val catch: ('a -> 'b) -> 'a -> 'b    (*exception Fail*)
  val recover: ('a -> 'b) -> (string -> 'a -> 'b) -> 'a -> 'b

  (*utils*)
  val triple1: ('a * 'b) * 'c -> 'a * 'b * 'c
  val triple2: 'a * ('b * 'c) -> 'a * 'b * 'c

  (*generic scanners*)
  val fail: 'a -> 'b
  val fail_with: ('a -> message) -> 'a -> 'b
  val succeed: 'a -> 'b -> 'a * 'b
  val some: ('a -> 'b option) -> 'a list -> 'b * 'a list
  val one: ('a -> bool) -> 'a list -> 'a * 'a list
  val this: string list -> string list -> string list * string list
  val this_string: string -> string list -> string * string list
  val many: ('a -> bool) -> 'a list -> 'a list * 'a list
  val many1: ('a -> bool) -> 'a list -> 'a list * 'a list
  val optional: ('a -> 'b * 'a) -> 'b -> 'a -> 'b * 'a
  val option: ('a -> 'b * 'a) -> 'a -> 'b option * 'a
  val repeat: ('a -> 'b * 'a) -> 'a -> 'b list * 'a
  val repeat1: ('a -> 'b * 'a) -> 'a -> 'b list * 'a
  val repeats: ('a -> 'b list * 'a) -> 'a -> 'b list * 'a
  val repeats1: ('a -> 'b list * 'a) -> 'a -> 'b list * 'a
  val single: ('a -> 'b * 'a) -> 'a -> 'b list * 'a
  val bulk: ('a -> 'b * 'a) -> 'a -> 'b list * 'a
  val max: ('a * 'a -> bool) -> ('b -> 'a * 'b) -> ('b -> 'a * 'b) -> 'b -> 'a * 'b
  val ahead: ('a -> 'b * 'c) -> 'a -> 'b * 'a
  val unless: ('a -> 'b * 'a) -> ('a -> 'c * 'd) -> 'a -> 'c * 'd
  val first: ('a -> 'b) list -> 'a -> 'b

  (*state based scanners*)
  val state: 'a * 'b -> 'a * ('a * 'b)
  val depend: ('a -> 'b -> ('c * 'd) * 'e) -> 'a * 'b -> 'd * ('c * 'e)
  val peek: ('a -> 'b -> 'c * 'd) -> 'a * 'b -> 'c * ('a * 'd)
  val provide: ('a -> bool) -> 'b -> ('b * 'c -> 'd * ('a * 'e)) -> 'c -> 'd * 'e
  val pass: 'a -> ('a * 'b -> 'c * ('d * 'e)) -> 'b -> 'c * 'e
  val lift: ('a -> 'b * 'c) -> 'd * 'a -> 'b * ('d * 'c)
  val unlift: (unit * 'a -> 'b * ('c * 'd)) -> 'a -> 'b * 'd

  (*trace input*)
  val trace: ('a list -> 'b * 'c list) -> 'a list -> ('b * 'a list) * 'c list

  (*stopper and finite scans*)
  type 'a stopper
  val stopper: ('a list -> 'a) -> ('a -> bool) -> 'a stopper
  val is_stopper: 'a stopper -> 'a -> bool
  val finite': 'a stopper -> ('b * 'a list -> 'c * ('d * 'a list))
    -> 'b * 'a list -> 'c * ('d * 'a list)
  val finite: 'a stopper -> ('a list -> 'b * 'a list) -> 'a list -> 'b * 'a list
  val read: 'a stopper -> ('a list -> 'b * 'a list) -> 'a list -> 'b option

  (*infinite scans -- draining state-based source*)
  val drain: ('a -> 'b list * 'a) -> 'b stopper -> ('c * 'b list -> 'd * ('e * 'b list)) ->
    ('c * 'b list) * 'a -> ('d * ('e * 'b list)) * 'a

  (*lexicon*)
  type lexicon
  val is_literal: lexicon -> string list -> bool
  val literal: lexicon -> (string * 'a) list -> (string * 'a) list * (string * 'a) list
  val empty_lexicon: lexicon
  val extend_lexicon: string list -> lexicon -> lexicon
  val make_lexicon: string list list -> lexicon
  val dest_lexicon: lexicon -> string list
  val merge_lexicons: lexicon * lexicon -> lexicon
end;
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 95 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 96 | structure Scan: SCAN = | 
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 97 | struct | 
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 98 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 99 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 100 | (** scanners **) | 
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 101 | |
| 23699 | 102 | (* exceptions *) | 
| 103 | ||
(*a message is a thunk; its text is only produced when the thunk is applied*)
type message = unit -> string;

(*need more input*)
exception MORE of unit;

(*try alternatives (reason of failure)*)
exception FAIL of message option;

(*dead end*)
exception ABORT of message;
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 109 | |
(*run scan on xs; a FAIL is converted into ABORT, with the message produced
  by err from the original input and the optional failure reason*)
fun !! err scan xs =
  scan xs
    handle FAIL reason => raise ABORT (err (xs, reason));
| 78817 | 111 | |
(*variant of !! with a standard message layout: prefix, then the position
  given by input_position (or " (end-of-input)" if it yields NONE), then the
  underlying reason; a reason that already starts with prefix is passed
  through unchanged*)
fun !!! prefix input_position scan =
  let
    fun located inp =
      prefix ^ (case input_position inp of SOME pos => pos | NONE => " (end-of-input)");

    (*the result is a thunk: nothing is formatted until the message is forced*)
    fun err (inp, reason) () =
      (case reason of
        NONE => located inp
      | SOME msg =>
          let val text = msg () in
            if String.isPrefix prefix text then text
            else located inp ^ ": " ^ text
          end);
  in !! err scan end;
| 124 | ||
(*downgrade both ABORT and MORE of scan to a plain FAIL without message*)
fun permissive scan xs =
  scan xs handle
    ABORT _ => raise FAIL NONE
  | MORE () => raise FAIL NONE;
(*a request for more input (MORE) counts as plain FAIL without message*)
fun strict scan xs =
  scan xs
    handle MORE () => raise FAIL NONE;
(*report ABORT of scan via Exn.error, forcing the message thunk*)
fun error scan xs =
  scan xs
    handle ABORT thunk => Exn.error (thunk ());
| 23699 | 128 | |
(*map ABORT and FAIL of scan to exception Fail; a FAIL without reason
  yields the text "Syntax error"*)
fun catch scan xs =
  scan xs handle
    FAIL NONE => raise Fail "Syntax error"
  | FAIL (SOME msg) => raise Fail (msg ())
  | ABORT msg => raise Fail (msg ());
| 23699 | 132 | |
(*try scan1 under catch; on exception Fail continue with scan2, which
  receives the failure text and the original input*)
fun recover scan1 scan2 xs =
  (catch scan1 xs)
    handle Fail reason => scan2 reason xs;
| 135 | ||
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 136 | |
| 61466 | 137 | (* utils *) | 
| 138 | ||
(*flatten a left-nested pair into a triple*)
fun triple1 (ab, c) =
  let val (a, b) = ab
  in (a, b, c) end;
(*flatten a right-nested pair into a triple*)
fun triple2 (a, bc) =
  let val (b, c) = bc
  in (a, b, c) end;
| 141 | ||
| 142 | ||
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 143 | (* scanner combinators *) | 
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 144 | |
(*apply f to the result of scan, leaving the remaining input untouched*)
fun (scan >> f) xs =
  let val (result, rest) = scan xs
  in (f result, rest) end;
| 14078 | 146 | |
(*alternative: if scan1 raises FAIL, run scan2 on the same input*)
fun (scan1 || scan2) xs =
  scan1 xs
    handle FAIL _ => scan2 xs;
| 14078 | 148 | |
(*dependent pairing: scan2 receives the result of scan1 and continues on the
  remaining input; both results are returned as a pair*)
fun (scan1 :-- scan2) xs =
  (case scan1 xs of
    (a, rest1) =>
      (case scan2 a rest1 of
        (b, rest2) => ((a, b), rest2)));
| 14078 | 154 | |
(*sequential pairing: like :-- but scan2 ignores the result of scan1*)
fun (scan1 -- scan2) = scan1 :-- K scan2;
(*dependent pairing, keeping only the second result*)
fun (scan1 :|-- scan2) = (scan1 :-- scan2) >> (fn (_, y) => y);
(*sequential pairing, keeping only the second result*)
fun (scan1 |-- scan2) = (scan1 -- scan2) >> (fn (_, y) => y);
(*sequential pairing, keeping only the first result*)
fun (scan1 --| scan2) = (scan1 -- scan2) >> (fn (x, _) => x);
(*sequential pairing of string results, joined by string concatenation*)
fun (scan1 ^^ scan2) = (scan1 -- scan2) >> (fn (s1, s2) => s1 ^ s2);
(*sequential pairing: result of scan1 is consed onto the list from scan2*)
fun (scan1 ::: scan2) = (scan1 -- scan2) >> (fn (x, xs) => x :: xs);
(*sequential pairing of list results, joined by list append*)
fun (scan1 @@@ scan2) = (scan1 -- scan2) >> (fn (xs, ys) => xs @ ys);
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 162 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 163 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 164 | (* generic scanners *) | 
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 165 | |
(*scanner that always raises FAIL without message, whatever the input*)
fun fail _ = raise (FAIL NONE);
(*scanner that always raises FAIL, with the message computed from the input*)
fun fail_with msg_of xs =
  let val msg = msg_of xs
  in raise FAIL (SOME msg) end;
(*scanner that returns y and leaves the input as it is*)
fun succeed y = fn xs => (y, xs);
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 169 | |
(*scan one element via partial function f: MORE on empty input, FAIL if f
  yields NONE for the head element*)
fun some f input =
  (case input of
    [] => raise MORE ()
  | x :: rest =>
      (case f x of
        NONE => raise FAIL NONE
      | SOME y => (y, rest)));
| 173 | ||
(*scan one element satisfying pred: MORE on empty input, FAIL if the head
  element is rejected*)
fun one pred input =
  (case input of
    [] => raise MORE ()
  | x :: rest => if pred x then (x, rest) else raise FAIL NONE);
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 177 | |
(*scan one string element that is equal to a*)
fun $$ (a: string) = one (fn s => s = a);
(*scan one string element that is different from a*)
fun ~$$ (a: string) = one (fn s => s <> a);
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 180 | |
(*scan exactly the elements ys from the front of xs: MORE if the input ends
  before ys is exhausted, FAIL on the first mismatch*)
fun this ys xs =
  let
    fun strip (expected, input) =
      (case (expected, input) of
        ([], rest) => rest
      | (_ :: _, []) => raise MORE ()
      | ((e: string) :: es, i :: rest) =>
          if e = i then strip (es, rest) else raise FAIL NONE);
  in (ys, strip (ys, xs)) end;
| 188 | ||
(*scan the raw characters of s and return s itself*)
(*primitive string -- no symbols here!*)
fun this_string s = this (raw_explode s) >> (fn _ => s);
| 14907 | 190 | |
(*scan the longest prefix of elements satisfying pred; raises MORE when the
  input runs out before a rejected element is seen*)
fun many pred input =
  (case input of
    [] => raise MORE ()
  | x :: rest =>
      if pred x then
        let val (accepted, remaining) = many pred rest
        in (x :: accepted, remaining) end
      else ([], input));
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 195 | |
(*like many, but the first element is required (scanned via one)*)
fun many1 pred = (one pred -- many pred) >> (fn (x, xs) => x :: xs);
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 197 | |
(*scan, or result def on unchanged input if scan raises FAIL*)
fun optional scan def = scan || (fn xs => (def, xs));
(*scan with result wrapped in SOME, or NONE on unchanged input if scan
  raises FAIL*)
fun option scan = optional (scan >> SOME) NONE;
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 200 | |
(*apply scan repeatedly until it raises FAIL; results are collected in
  order of occurrence (tail-recursive accumulator, reversed at the end)*)
fun repeat scan =
  let
    fun attempt input = SOME (scan input) handle FAIL _ => NONE;

    fun loop acc input =
      (case attempt input of
        SOME (item, rest) => loop (item :: acc) rest
      | NONE => (rev acc, input));
  in loop [] end;
| 13795 | 208 | |
(*like repeat, but the first application of scan is required*)
fun repeat1 scan = (scan -- repeat scan) >> (fn (x, xs) => x :: xs);
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 210 | |
(*repeat a list-valued scanner and concatenate all result lists*)
fun repeats scan = repeat scan >> List.concat;
(*repeat1 for a list-valued scanner, concatenating all result lists*)
fun repeats1 scan = repeat1 scan >> List.concat;
| 213 | ||
(*wrap the result of scan into a singleton list*)
fun single scan xs =
  let val (x, rest) = scan xs
  in ([x], rest) end;
(*one required scan, followed by as many permissive scans as succeed*)
fun bulk scan = scan ::: repeat (permissive scan);
| 216 | ||
(*run scan1 and scan2 on the same input and keep one outcome: if both
  succeed, scan1 wins when leq (tok2, tok1) holds, otherwise scan2; if only
  one succeeds, that one is taken; if none succeeds, FAIL is raised*)
fun max leq scan1 scan2 xs =
  let
    val (res1, rest1) = option scan1 xs;
    val (res2, rest2) = option scan2 xs;
  in
    (case (res1, res2) of
      (SOME tok1, SOME tok2) =>
        if leq (tok2, tok1) then (tok1, rest1) else (tok2, rest2)
    | (SOME tok1, NONE) => (tok1, rest1)
    | (NONE, SOME tok2) => (tok2, rest2)
    | (NONE, NONE) => raise FAIL NONE)  (*loses FAIL msg!*)
  end;
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 224 | |
(*look ahead: return the result of scan, but keep the original input*)
fun ahead scan xs =
  let val (y, _) = scan xs
  in (y, xs) end;
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 226 | |
(*run scan only if test does not succeed on the same input (checked by
  look-ahead); otherwise fail*)
fun unless test scan =
  ahead (option test) :|-- (fn NONE => scan | SOME _ => fail);
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 229 | |
(*chain a list of scanners with ||; the empty list yields fail*)
fun first scans =
  (case scans of
    [] => fail
  | scan :: rest => scan || first rest);
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 232 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 233 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 234 | (* state based scanners *) | 
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 235 | |
(*return the current state as result, leaving state and input unchanged*)
fun state (arg as (st, _)) = (st, arg);
| 237 | ||
(*run a scanner that depends on the state st and yields a new state together
  with its result; the new state is threaded into the output*)
fun depend scan (st, xs) =
  (case scan st xs of
    ((st', y), rest) => (y, (st', rest)));
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 241 | |
(*run a scanner that may inspect the state st; the state itself is kept*)
fun peek scan = depend (fn st => scan st >> (fn y => (st, y)));
| 243 | ||
(*run a state-based scanner from initial state st on plain input xs; the
  final state is dropped from the result, but must satisfy pred, otherwise
  FAIL is raised*)
fun provide pred st scan xs =
  (case scan (st, xs) of
    (y, (st', rest)) => if pred st' then (y, rest) else raise FAIL NONE);
| 
8284c0d5bf52
clarified scan_cartouche_depth, according to Scala version;
 wenzelm parents: 
48743diff
changeset | 247 | |
(*provide without any condition on the final state*)
fun pass st = provide (fn _ => true) st;
| 15664 | 249 | |
(*turn a plain scanner into a state-based one that passes the state through*)
fun lift scan (st, xs) =
  (case scan xs of
    (y, rest) => (y, (st, rest)));
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 253 | |
(*run a state-based scanner with the trivial state (), dropping the final
  state from the result*)
fun unlift scan = provide (fn _ => true) () scan;
| 255 | ||
| 256 | ||
| 257 | (* trace input *) | |
| 258 | ||
(*run scan and additionally return a prefix of the input xs whose length is
  the difference between the lengths of the input and of the remaining list*)
fun trace scan xs =
  let
    val (y, rest) = scan xs;
    val consumed = length xs - length rest;
  in ((y, take consumed xs), rest) end;
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 262 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 263 | |
| 27731 
a7444ded92cf
abstract type stopper, may depend on final input;
 wenzelm parents: 
25999diff
changeset | 264 | (* stopper *) | 
| 
a7444ded92cf
abstract type stopper, may depend on final input;
 wenzelm parents: 
25999diff
changeset | 265 | |
(*a stopper consists of a function that makes the stopper element from an
  input list, and a predicate that recognizes stopper elements*)
datatype 'a stopper = Stopper of ('a list -> 'a) * ('a -> bool);

fun stopper make test = Stopper (make, test);

fun is_stopper (Stopper (_, test)) = test;
| 
a7444ded92cf
abstract type stopper, may depend on final input;
 wenzelm parents: 
25999diff
changeset | 270 | |
| 
a7444ded92cf
abstract type stopper, may depend on final input;
 wenzelm parents: 
25999diff
changeset | 271 | |
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 272 | (* finite scans *) | 
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 273 | |
(*state-based scan of finite input: the input must not contain a stopper
  element; one stopper (made from the input) is appended, the scanner is run
  in strict mode, and the stopper is removed again from the end of the
  remaining input.  ABORT if the stopper occurs in the input beforehand or is
  missing afterwards.*)
fun finite' (Stopper (mk_stopper, is_stopper)) scan (state, input) =
  let
    fun lost () = raise ABORT (fn () => "Bad scanner: lost stopper of finite scan!");

    (*strip the final stopper element from the remaining input*)
    fun stop remaining =
      if null remaining then lost ()
      else
        (case split_last remaining of
          (front, final) => if is_stopper final then ((), front) else lost ());
  in
    if not (exists is_stopper input) then
      (strict scan --| lift stop) (state, input @ [mk_stopper input])
    else raise ABORT (fn () => "Stopper may not occur in input of finite scan!")
  end;
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 287 | |
(*finite' for a plain scanner: lifted to the state-based form and unlifted
  again*)
fun finite stopper scan =
  let val lifted = finite' stopper (lift scan)
  in unlift lifted end;
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 289 | |
(*finite scan of xs as a whole: SOME result only if scan succeeds and no
  input remains, otherwise NONE; ABORT is reported via error*)
fun read stopper scan xs =
  let val (result, rest) = error (finite stopper (option scan)) xs
  in if null rest then result else NONE end;
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 294 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 295 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 296 | (* infinite scans -- draining state-based source *) | 
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 297 | |
| 58850 | 298 | fun drain get stopper scan ((state, xs), src) = (*run scan on the buffered input xs; whenever it raises MORE, fetch further input from src via get*) | 
| 299 | (scan (state, xs), src) handle MORE () => | | 
| 300 | (case get src of | | 
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 301 | ([], _) => (finite' stopper scan (state, xs), src) (*get delivered no further input: finish with a finite scan of xs, returning the original src*) | 
| 58850 | 302 | | (xs', src') => drain get stopper scan ((state, xs @ xs'), src')); (*append the new input and retry from the same state*) | 
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 303 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 304 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 305 | |
| 27782 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 306 | (** datatype lexicon -- position tree **) | 
| 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 307 | |
| 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 308 | datatype lexicon = Lexicon of (bool * lexicon) Symtab.table; (*nested tables: each key maps to (tip, sub-lexicon), where tip = true marks that the path ending at this key is a complete literal*) | 
| 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 309 | |
| 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 310 | val empty_lexicon = Lexicon Symtab.empty; (*lexicon without any entries*) | 
| 59071 | 311 | fun is_empty_lexicon (Lexicon tab) = Symtab.is_empty tab; (*true iff the top-level table has no entries*) | 
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 312 | |
| 27782 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 313 | fun is_literal _ [] = false (*membership test: the empty list is never a literal*) | 
| 32784 | 314 | | is_literal (Lexicon tab) (c :: cs) = | 
| 27782 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 315 | (case Symtab.lookup tab c of | 
| 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 316 | SOME (tip, lex) => tip andalso null cs orelse is_literal lex cs (*parses as (tip andalso null cs) orelse ...: either the list ends exactly at a tip, or the rest is looked up in the sub-lexicon*) | 
| 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 317 | | NONE => false); (*no entry for c at this level*) | 
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 318 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 319 | |
| 27782 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 320 | (* scan longest match *) | 
| 27765 
5df443dd9deb
reorganized lexicon: allow scanning of annotated symbols, tuned representation and interfaces;
 wenzelm parents: 
27731diff
changeset | 321 | |
| 27782 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 322 | fun literal lexicon = (*scanner for the longest prefix of the input that is a literal of lexicon; input elements are pairs whose first component is the lookup key*) | 
| 27765 
5df443dd9deb
reorganized lexicon: allow scanning of annotated symbols, tuned representation and interfaces;
 wenzelm parents: 
27731diff
changeset | 323 | let | 
| 27782 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 324 | fun finish (SOME (res, rest)) = (rev res, rest) (*res was accumulated in reverse order*) | 
| 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 325 | | finish NONE = raise FAIL NONE; (*no literal was matched at all*) | 
| 58850 | 326 | fun scan _ res (Lexicon tab) [] = (*input exhausted*) | 
| 327 | if Symtab.is_empty tab then finish res else raise MORE () (*a longer match is still possible unless the current table is empty*) | | 
| 32784 | 328 | | scan path res (Lexicon tab) (c :: cs) = | 
| 27782 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 329 | (case Symtab.lookup tab (fst c) of | 
| 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 330 | SOME (tip, lex) => | 
| 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 331 | let val path' = c :: path | 
| 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 332 | in scan path' (if tip then SOME (path', cs) else res) lex cs end (*at a tip, record this match together with the remaining input, then try to extend it*) | 
| 27784 | 333 | | NONE => finish res); (*cannot extend further: fall back to the last recorded match*) | 
| 27782 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 334 | in scan [] NONE lexicon end; | 
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 335 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 336 | |
| 27765 
5df443dd9deb
reorganized lexicon: allow scanning of annotated symbols, tuned representation and interfaces;
 wenzelm parents: 
27731diff
changeset | 337 | (* build lexicons *) | 
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 338 | |
| 27765 
5df443dd9deb
reorganized lexicon: allow scanning of annotated symbols, tuned representation and interfaces;
 wenzelm parents: 
27731diff
changeset | 339 | fun extend_lexicon chrs lexicon = (*add the key list chrs as a literal to lexicon*) | 
| 
5df443dd9deb
reorganized lexicon: allow scanning of annotated symbols, tuned representation and interfaces;
 wenzelm parents: 
27731diff
changeset | 340 | let | 
| 27782 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 341 | fun ext [] lex = lex | 
| 32784 | 342 | | ext (c :: cs) (Lexicon tab) = | 
| 27782 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 343 | (case Symtab.lookup tab c of | 
| 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 344 | SOME (tip, lex) => Lexicon (Symtab.update (c, (tip orelse null cs, ext cs lex)) tab) (*existing entry: keep an earlier tip, set it if chrs ends here*) | 
| 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 345 | | NONE => Lexicon (Symtab.update (c, (null cs, ext cs empty_lexicon)) tab)); (*new entry: tip only if chrs ends here, remainder goes into a fresh sub-lexicon*) | 
| 27765 
5df443dd9deb
reorganized lexicon: allow scanning of annotated symbols, tuned representation and interfaces;
 wenzelm parents: 
27731diff
changeset | 346 | in if is_literal lexicon chrs then lexicon else ext chrs lexicon end; (*already present: return the given lexicon value unchanged*) | 
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 347 | |
| 27765 
5df443dd9deb
reorganized lexicon: allow scanning of annotated symbols, tuned representation and interfaces;
 wenzelm parents: 
27731diff
changeset | 348 | fun make_lexicon chrss = fold extend_lexicon chrss empty_lexicon; (*build a lexicon by adding each element of chrss to the empty lexicon*) | 
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 349 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 350 | |
| 27765 
5df443dd9deb
reorganized lexicon: allow scanning of annotated symbols, tuned representation and interfaces;
 wenzelm parents: 
27731diff
changeset | 351 | (* merge lexicons *) | 
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 352 | |
| 27782 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 353 | fun dest path (Lexicon tab) = Symtab.fold (fn (d, (tip, lex)) => (*collect the literals stored below this node; path is the reversed list of keys leading to it*) | 
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 354 | let | 
| 27782 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 355 | val path' = d :: path; | 
| 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 356 | val content = dest path' lex; | 
| 
377810fd718e
datatype lexicon: alternative representation using nested Symtab.table;
 wenzelm parents: 
27765diff
changeset | 357 | in append (if tip then rev path' :: content else content) end) tab []; (*a tip contributes its own path in forward order; append is defined outside this file section*) | 
| 27765 
5df443dd9deb
reorganized lexicon: allow scanning of annotated symbols, tuned representation and interfaces;
 wenzelm parents: 
27731diff
changeset | 358 | |
| 59196 | 359 | val dest_lexicon = sort_strings o map implode o dest []; (*all literals of a lexicon, each imploded to a string, passed through sort_strings*) | 
| 59071 | 360 | |
| 361 | fun merge_lexicons (lex1, lex2) = (*lexicon containing the literals of both arguments*) | | 
| 362 | if pointer_eq (lex1, lex2) then lex1 (*same object: nothing to merge*) | | 
| 363 | else if is_empty_lexicon lex1 then lex2 (*nothing in lex1: reuse lex2 as it is*) | | 
| 364 | else fold extend_lexicon (dest [] lex2) lex1; (*otherwise add every literal of lex2 to lex1*) | | 
| 6116 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 365 | |
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 366 | end; | 
| 
8ba2f25610f7
files scan.ML, source.ML, symbol.ML, pretty.ML moved to Pure/General;
 wenzelm parents: diff
changeset | 367 | |
| 37216 
3165bc303f66
modernized some structure names, keeping a few legacy aliases;
 wenzelm parents: 
33957diff
changeset | 368 | structure Basic_Scan: BASIC_SCAN = Scan; (*view of Scan constrained to signature BASIC_SCAN*) | 
| 
3165bc303f66
modernized some structure names, keeping a few legacy aliases;
 wenzelm parents: 
33957diff
changeset | 369 | open Basic_Scan; (*make the BASIC_SCAN items available unqualified*) |