author | wenzelm |
Mon, 28 Nov 2011 22:05:32 +0100 | |
changeset 45666 | d83797ef0d2d |
parent 44736 | c2a3f1c84179 |
child 48743 | a72f8ffecf31 |
permissions | -rw-r--r-- |
24579 | 1 |
(* Title: Pure/ML/ml_lex.ML |
2 |
Author: Makarius |
|
3 |
||
4 |
Lexical syntax for SML. |
|
5 |
*) |
|
6 |
||
7 |
signature ML_LEX = |
|
8 |
sig |
|
9 |
datatype token_kind = |
|
24596 | 10 |
Keyword | Ident | LongIdent | TypeVar | Word | Int | Real | Char | String | |
24579 | 11 |
Space | Comment | Error of string | EOF |
12 |
eqtype token |
|
27732 | 13 |
val stopper: token Scan.stopper |
24596 | 14 |
val is_regular: token -> bool |
15 |
val is_improper: token -> bool |
|
30683
e8ac1f9d9469
datatype antiquote: maintain original Position.range, which is eventually attached to the resulting ML tokens;
wenzelm
parents:
30645
diff
changeset
|
16 |
val set_range: Position.range -> token -> token |
30636 | 17 |
val pos_of: token -> Position.T |
31474 | 18 |
val end_pos_of: token -> Position.T |
24579 | 19 |
val kind_of: token -> token_kind |
27817 | 20 |
val content_of: token -> string |
31426 | 21 |
val check_content_of: token -> string |
31332 | 22 |
val flatten: token list -> string |
24579 | 23 |
val keywords: string list |
24596 | 24 |
val source: (Symbol.symbol, 'a) Source.source -> |
30573 | 25 |
(token, (Symbol_Pos.T, Position.T * (Symbol.symbol, 'a) Source.source) |
27772 | 26 |
Source.source) Source.source |
30591 | 27 |
val tokenize: string -> token list |
37198
3af985b10550
replaced ML_Lex.read_antiq by more concise ML_Lex.read, which includes full read/report with explicit position information;
wenzelm
parents:
37195
diff
changeset
|
28 |
val read: Position.T -> Symbol_Pos.text -> token Antiquote.antiquote list |
24579 | 29 |
end; |
30 |
||
31 |
structure ML_Lex: ML_LEX = |
|
32 |
struct |
|
33 |
||
34 |
(** tokens **) |
|
35 |
||
36 |
(* datatype token *) |
|
37 |
||
38 |
datatype token_kind = |
|
24596 | 39 |
Keyword | Ident | LongIdent | TypeVar | Word | Int | Real | Char | String | |
24579 | 40 |
Space | Comment | Error of string | EOF; |
41 |
||
27772 | 42 |
datatype token = Token of Position.range * (token_kind * string); |
43 |
||
44 |
||
45 |
(* position *) |
|
46 |
||
30683
e8ac1f9d9469
datatype antiquote: maintain original Position.range, which is eventually attached to the resulting ML tokens;
wenzelm
parents:
30645
diff
changeset
|
47 |
fun set_range range (Token (_, x)) = Token (range, x); |
e8ac1f9d9469
datatype antiquote: maintain original Position.range, which is eventually attached to the resulting ML tokens;
wenzelm
parents:
30645
diff
changeset
|
48 |
|
30636 | 49 |
fun pos_of (Token ((pos, _), _)) = pos; |
50 |
fun end_pos_of (Token ((_, pos), _)) = pos; |
|
24579 | 51 |
|
52 |
||
24596 | 53 |
(* control tokens *) |
24579 | 54 |
|
27772 | 55 |
fun mk_eof pos = Token ((pos, Position.none), (EOF, "")); |
56 |
val eof = mk_eof Position.none; |
|
24579 | 57 |
|
58 |
fun is_eof (Token (_, (EOF, _))) = true |
|
59 |
| is_eof _ = false; |
|
60 |
||
27772 | 61 |
val stopper = |
30636 | 62 |
Scan.stopper (fn [] => eof | toks => mk_eof (end_pos_of (List.last toks))) is_eof; |
27772 | 63 |
|
24579 | 64 |
|
27772 | 65 |
(* token content *) |
66 |
||
31426 | 67 |
fun kind_of (Token (_, (k, _))) = k; |
68 |
||
27817 | 69 |
fun content_of (Token (_, (_, x))) = x; |
70 |
fun token_leq (tok, tok') = content_of tok <= content_of tok'; |
|
27772 | 71 |
|
41502
967cbbc77abd
refined ML_Lex.flatten: ensure proper separation of tokens;
wenzelm
parents:
40627
diff
changeset
|
72 |
fun is_regular (Token (_, (Error _, _))) = false |
967cbbc77abd
refined ML_Lex.flatten: ensure proper separation of tokens;
wenzelm
parents:
40627
diff
changeset
|
73 |
| is_regular (Token (_, (EOF, _))) = false |
967cbbc77abd
refined ML_Lex.flatten: ensure proper separation of tokens;
wenzelm
parents:
40627
diff
changeset
|
74 |
| is_regular _ = true; |
967cbbc77abd
refined ML_Lex.flatten: ensure proper separation of tokens;
wenzelm
parents:
40627
diff
changeset
|
75 |
|
967cbbc77abd
refined ML_Lex.flatten: ensure proper separation of tokens;
wenzelm
parents:
40627
diff
changeset
|
76 |
fun is_improper (Token (_, (Space, _))) = true |
967cbbc77abd
refined ML_Lex.flatten: ensure proper separation of tokens;
wenzelm
parents:
40627
diff
changeset
|
77 |
| is_improper (Token (_, (Comment, _))) = true |
967cbbc77abd
refined ML_Lex.flatten: ensure proper separation of tokens;
wenzelm
parents:
40627
diff
changeset
|
78 |
| is_improper _ = false; |
967cbbc77abd
refined ML_Lex.flatten: ensure proper separation of tokens;
wenzelm
parents:
40627
diff
changeset
|
79 |
|
40337
d25bbb5f1c9e
warn in correlation with report -- avoid spurious message duplicates;
wenzelm
parents:
40319
diff
changeset
|
80 |
fun warn tok = |
d25bbb5f1c9e
warn in correlation with report -- avoid spurious message duplicates;
wenzelm
parents:
40319
diff
changeset
|
81 |
(case tok of |
d25bbb5f1c9e
warn in correlation with report -- avoid spurious message duplicates;
wenzelm
parents:
40319
diff
changeset
|
82 |
Token (_, (Keyword, ":>")) => |
d25bbb5f1c9e
warn in correlation with report -- avoid spurious message duplicates;
wenzelm
parents:
40319
diff
changeset
|
83 |
warning ("Opaque signature matching (:>) fails to work with ML pretty printing --\n\ |
d25bbb5f1c9e
warn in correlation with report -- avoid spurious message duplicates;
wenzelm
parents:
40319
diff
changeset
|
84 |
\prefer non-opaque matching (:) possibly with abstype" ^ |
d25bbb5f1c9e
warn in correlation with report -- avoid spurious message duplicates;
wenzelm
parents:
40319
diff
changeset
|
85 |
Position.str_of (pos_of tok)) |
d25bbb5f1c9e
warn in correlation with report -- avoid spurious message duplicates;
wenzelm
parents:
40319
diff
changeset
|
86 |
| _ => ()); |
d25bbb5f1c9e
warn in correlation with report -- avoid spurious message duplicates;
wenzelm
parents:
40319
diff
changeset
|
87 |
|
31426 | 88 |
fun check_content_of tok = |
30636 | 89 |
(case kind_of tok of |
30645 | 90 |
Error msg => error msg |
40337
d25bbb5f1c9e
warn in correlation with report -- avoid spurious message duplicates;
wenzelm
parents:
40319
diff
changeset
|
91 |
| _ => content_of tok); |
30636 | 92 |
|
41502
967cbbc77abd
refined ML_Lex.flatten: ensure proper separation of tokens;
wenzelm
parents:
40627
diff
changeset
|
93 |
fun flatten_content (tok :: (toks as tok' :: _)) = |
967cbbc77abd
refined ML_Lex.flatten: ensure proper separation of tokens;
wenzelm
parents:
40627
diff
changeset
|
94 |
Symbol.escape (check_content_of tok) :: |
967cbbc77abd
refined ML_Lex.flatten: ensure proper separation of tokens;
wenzelm
parents:
40627
diff
changeset
|
95 |
(if is_improper tok orelse is_improper tok' then flatten_content toks |
967cbbc77abd
refined ML_Lex.flatten: ensure proper separation of tokens;
wenzelm
parents:
40627
diff
changeset
|
96 |
else Symbol.space :: flatten_content toks) |
967cbbc77abd
refined ML_Lex.flatten: ensure proper separation of tokens;
wenzelm
parents:
40627
diff
changeset
|
97 |
| flatten_content toks = map (Symbol.escape o check_content_of) toks; |
31332 | 98 |
|
41502
967cbbc77abd
refined ML_Lex.flatten: ensure proper separation of tokens;
wenzelm
parents:
40627
diff
changeset
|
99 |
val flatten = implode o flatten_content; |
24596 | 100 |
|
101 |
||
30614 | 102 |
(* markup *) |
103 |
||
37195 | 104 |
local |
105 |
||
30645 | 106 |
val token_kind_markup = |
45666 | 107 |
fn Keyword => Isabelle_Markup.ML_keyword |
44706
fe319b45315c
eliminated markup for plain identifiers (frequent but insignificant);
wenzelm
parents:
43947
diff
changeset
|
108 |
| Ident => Markup.empty |
fe319b45315c
eliminated markup for plain identifiers (frequent but insignificant);
wenzelm
parents:
43947
diff
changeset
|
109 |
| LongIdent => Markup.empty |
45666 | 110 |
| TypeVar => Isabelle_Markup.ML_tvar |
111 |
| Word => Isabelle_Markup.ML_numeral |
|
112 |
| Int => Isabelle_Markup.ML_numeral |
|
113 |
| Real => Isabelle_Markup.ML_numeral |
|
114 |
| Char => Isabelle_Markup.ML_char |
|
115 |
| String => Isabelle_Markup.ML_string |
|
38474
e498dc2eb576
uniform Markup.empty/Markup.Empty in ML and Scala;
wenzelm
parents:
37209
diff
changeset
|
116 |
| Space => Markup.empty |
45666 | 117 |
| Comment => Isabelle_Markup.ML_comment |
118 |
| Error _ => Isabelle_Markup.ML_malformed |
|
38474
e498dc2eb576
uniform Markup.empty/Markup.Empty in ML and Scala;
wenzelm
parents:
37209
diff
changeset
|
119 |
| EOF => Markup.empty; |
30614 | 120 |
|
37195 | 121 |
fun token_markup kind x = |
122 |
if kind = Keyword andalso exists_string (not o Symbol.is_ascii_letter) x |
|
45666 | 123 |
then Isabelle_Markup.ML_delimiter |
37195 | 124 |
else token_kind_markup kind; |
125 |
||
126 |
in |
|
127 |
||
44736 | 128 |
fun report_of_token (Token ((pos, _), (kind, x))) = (pos, token_markup kind x); |
37195 | 129 |
|
130 |
end; |
|
30614 | 131 |
|
132 |
||
24579 | 133 |
|
134 |
(** scanners **) |
|
135 |
||
30573 | 136 |
open Basic_Symbol_Pos; |
24579 | 137 |
|
43947
9b00f09f7721
defer evaluation of Scan.message, for improved performance in the frequent situation where failure is handled later (e.g. via ||);
wenzelm
parents:
41502
diff
changeset
|
138 |
fun !!! msg = Symbol_Pos.!!! (fn () => "SML lexical error: " ^ msg); |
24579 | 139 |
|
140 |
||
27772 | 141 |
(* blanks *) |
24579 | 142 |
|
40525
14a2e686bdac
eliminated slightly odd pervasive Symbol_Pos.symbol;
wenzelm
parents:
40523
diff
changeset
|
143 |
val scan_blank = Scan.one (Symbol.is_ascii_blank o Symbol_Pos.symbol); |
27772 | 144 |
val scan_blanks1 = Scan.repeat1 scan_blank; |
24579 | 145 |
|
146 |
||
147 |
(* keywords *) |
|
148 |
||
149 |
val keywords = ["#", "(", ")", ",", "->", "...", ":", ":>", ";", "=", |
|
150 |
"=>", "[", "]", "_", "{", "|", "}", "abstype", "and", "andalso", "as", |
|
151 |
"case", "datatype", "do", "else", "end", "eqtype", "exception", "fn", |
|
152 |
"fun", "functor", "handle", "if", "in", "include", "infix", "infixr", |
|
153 |
"let", "local", "nonfix", "of", "op", "open", "orelse", "raise", "rec", |
|
154 |
"sharing", "sig", "signature", "struct", "structure", "then", "type", |
|
155 |
"val", "where", "while", "with", "withtype"]; |
|
156 |
||
40627
becf5d5187cc
renamed raw "explode" function to "raw_explode" to emphasize its meaning;
wenzelm
parents:
40525
diff
changeset
|
157 |
val lex = Scan.make_lexicon (map raw_explode keywords); |
27772 | 158 |
fun scan_keyword x = Scan.literal lex x; |
24579 | 159 |
|
160 |
||
161 |
(* identifiers *) |
|
162 |
||
24596 | 163 |
local |
164 |
||
24579 | 165 |
val scan_letdigs = |
40525
14a2e686bdac
eliminated slightly odd pervasive Symbol_Pos.symbol;
wenzelm
parents:
40523
diff
changeset
|
166 |
Scan.many |
14a2e686bdac
eliminated slightly odd pervasive Symbol_Pos.symbol;
wenzelm
parents:
40523
diff
changeset
|
167 |
((Symbol.is_ascii_letter orf Symbol.is_ascii_digit orf Symbol.is_ascii_quasi) o |
14a2e686bdac
eliminated slightly odd pervasive Symbol_Pos.symbol;
wenzelm
parents:
40523
diff
changeset
|
168 |
Symbol_Pos.symbol); |
24579 | 169 |
|
40525
14a2e686bdac
eliminated slightly odd pervasive Symbol_Pos.symbol;
wenzelm
parents:
40523
diff
changeset
|
170 |
val scan_alphanumeric = |
14a2e686bdac
eliminated slightly odd pervasive Symbol_Pos.symbol;
wenzelm
parents:
40523
diff
changeset
|
171 |
Scan.one (Symbol.is_ascii_letter o Symbol_Pos.symbol) -- scan_letdigs >> op ::; |
24579 | 172 |
|
40525
14a2e686bdac
eliminated slightly odd pervasive Symbol_Pos.symbol;
wenzelm
parents:
40523
diff
changeset
|
173 |
val scan_symbolic = |
40627
becf5d5187cc
renamed raw "explode" function to "raw_explode" to emphasize its meaning;
wenzelm
parents:
40525
diff
changeset
|
174 |
Scan.many1 (member (op =) (raw_explode "!#$%&*+-/:<=>?@\\^`|~") o Symbol_Pos.symbol); |
24579 | 175 |
|
24596 | 176 |
in |
177 |
||
24579 | 178 |
val scan_ident = scan_alphanumeric || scan_symbolic; |
179 |
||
180 |
val scan_longident = |
|
27772 | 181 |
(Scan.repeat1 (scan_alphanumeric @@@ $$$ ".") >> flat) @@@ (scan_ident || $$$ "="); |
24579 | 182 |
|
27772 | 183 |
val scan_typevar = $$$ "'" @@@ scan_letdigs; |
24579 | 184 |
|
24596 | 185 |
end; |
24579 | 186 |
|
187 |
||
188 |
(* numerals *) |
|
189 |
||
24596 | 190 |
local |
191 |
||
40525
14a2e686bdac
eliminated slightly odd pervasive Symbol_Pos.symbol;
wenzelm
parents:
40523
diff
changeset
|
192 |
val scan_dec = Scan.many1 (Symbol.is_ascii_digit o Symbol_Pos.symbol); |
14a2e686bdac
eliminated slightly odd pervasive Symbol_Pos.symbol;
wenzelm
parents:
40523
diff
changeset
|
193 |
val scan_hex = Scan.many1 (Symbol.is_ascii_hex o Symbol_Pos.symbol); |
27772 | 194 |
val scan_sign = Scan.optional ($$$ "~") []; |
195 |
val scan_decint = scan_sign @@@ scan_dec; |
|
24579 | 196 |
|
24596 | 197 |
in |
198 |
||
27772 | 199 |
val scan_word = |
200 |
$$$ "0" @@@ $$$ "w" @@@ $$$ "x" @@@ scan_hex || |
|
201 |
$$$ "0" @@@ $$$ "w" @@@ scan_dec; |
|
24579 | 202 |
|
27772 | 203 |
val scan_int = scan_sign @@@ ($$$ "0" @@@ $$$ "x" @@@ scan_hex || scan_dec); |
24579 | 204 |
|
27772 | 205 |
val scan_exp = ($$$ "E" || $$$ "e") @@@ scan_decint; |
24579 | 206 |
|
207 |
val scan_real = |
|
27772 | 208 |
scan_decint @@@ $$$ "." @@@ scan_dec @@@ Scan.optional scan_exp [] || |
209 |
scan_decint @@@ scan_exp; |
|
24579 | 210 |
|
24596 | 211 |
end; |
212 |
||
24579 | 213 |
|
214 |
(* chars and strings *) |
|
215 |
||
24596 | 216 |
local |
217 |
||
218 |
val scan_escape = |
|
40627
becf5d5187cc
renamed raw "explode" function to "raw_explode" to emphasize its meaning;
wenzelm
parents:
40525
diff
changeset
|
219 |
Scan.one (member (op =) (raw_explode "\"\\abtnvfr") o Symbol_Pos.symbol) >> single || |
27772 | 220 |
$$$ "^" @@@ (Scan.one (fn (s, _) => ord "@" <= ord s andalso ord s <= ord "_") >> single) || |
40525
14a2e686bdac
eliminated slightly odd pervasive Symbol_Pos.symbol;
wenzelm
parents:
40523
diff
changeset
|
221 |
Scan.one (Symbol.is_ascii_digit o Symbol_Pos.symbol) -- |
14a2e686bdac
eliminated slightly odd pervasive Symbol_Pos.symbol;
wenzelm
parents:
40523
diff
changeset
|
222 |
Scan.one (Symbol.is_ascii_digit o Symbol_Pos.symbol) -- |
14a2e686bdac
eliminated slightly odd pervasive Symbol_Pos.symbol;
wenzelm
parents:
40523
diff
changeset
|
223 |
Scan.one (Symbol.is_ascii_digit o Symbol_Pos.symbol) >> (fn ((a, b), c) => [a, b, c]); |
24596 | 224 |
|
225 |
val scan_str = |
|
30600
de241396389c
allow non-printable symbols within string tokens;
wenzelm
parents:
30593
diff
changeset
|
226 |
Scan.one (fn (s, _) => Symbol.is_regular s andalso s <> "\"" andalso s <> "\\" andalso |
de241396389c
allow non-printable symbols within string tokens;
wenzelm
parents:
30593
diff
changeset
|
227 |
(not (Symbol.is_char s) orelse Symbol.is_printable s)) >> single || |
27772 | 228 |
$$$ "\\" @@@ !!! "bad escape character in string" scan_escape; |
24596 | 229 |
|
27772 | 230 |
val scan_gap = $$$ "\\" @@@ scan_blanks1 @@@ $$$ "\\"; |
231 |
val scan_gaps = Scan.repeat scan_gap >> flat; |
|
24579 | 232 |
|
24596 | 233 |
in |
24579 | 234 |
|
235 |
val scan_char = |
|
27772 | 236 |
$$$ "#" @@@ $$$ "\"" @@@ scan_gaps @@@ scan_str @@@ scan_gaps @@@ $$$ "\""; |
24579 | 237 |
|
238 |
val scan_string = |
|
27772 | 239 |
$$$ "\"" @@@ !!! "missing quote at end of string" |
240 |
((Scan.repeat (scan_gap || scan_str) >> flat) @@@ $$$ "\""); |
|
24596 | 241 |
|
242 |
end; |
|
24579 | 243 |
|
244 |
||
30645 | 245 |
(* scan tokens *) |
24579 | 246 |
|
247 |
local |
|
248 |
||
30593 | 249 |
fun token k ss = Token (Symbol_Pos.range ss, (k, Symbol_Pos.content ss)); |
24579 | 250 |
|
30593 | 251 |
val scan_ml = |
27772 | 252 |
(scan_char >> token Char || |
253 |
scan_string >> token String || |
|
254 |
scan_blanks1 >> token Space || |
|
30573 | 255 |
Symbol_Pos.scan_comment !!! >> token Comment || |
27772 | 256 |
Scan.max token_leq |
257 |
(scan_keyword >> token Keyword) |
|
258 |
(scan_word >> token Word || |
|
259 |
scan_real >> token Real || |
|
260 |
scan_int >> token Int || |
|
261 |
scan_longident >> token LongIdent || |
|
262 |
scan_ident >> token Ident || |
|
263 |
scan_typevar >> token TypeVar)); |
|
264 |
||
30645 | 265 |
val scan_antiq = Antiquote.scan || scan_ml >> Antiquote.Text; |
266 |
||
27772 | 267 |
fun recover msg = |
40525
14a2e686bdac
eliminated slightly odd pervasive Symbol_Pos.symbol;
wenzelm
parents:
40523
diff
changeset
|
268 |
Scan.many (((not o Symbol.is_blank) andf Symbol.is_regular) o Symbol_Pos.symbol) |
27772 | 269 |
>> (fn cs => [token (Error msg) cs]); |
24579 | 270 |
|
271 |
in |
|
272 |
||
24596 | 273 |
fun source src = |
30573 | 274 |
Symbol_Pos.source (Position.line 1) src |
30593 | 275 |
|> Source.source Symbol_Pos.stopper (Scan.bulk (!!! "bad input" scan_ml)) (SOME (false, recover)); |
30591 | 276 |
|
40523
1050315f6ee2
simplified/robustified treatment of malformed symbols, which are now fully internalized (total Symbol.explode etc.);
wenzelm
parents:
40337
diff
changeset
|
277 |
val tokenize = Source.of_string #> Symbol.source #> source #> Source.exhaust; |
24579 | 278 |
|
37198
3af985b10550
replaced ML_Lex.read_antiq by more concise ML_Lex.read, which includes full read/report with explicit position information;
wenzelm
parents:
37195
diff
changeset
|
279 |
fun read pos txt = |
3af985b10550
replaced ML_Lex.read_antiq by more concise ML_Lex.read, which includes full read/report with explicit position information;
wenzelm
parents:
37195
diff
changeset
|
280 |
let |
45666 | 281 |
val _ = Position.report pos Isabelle_Markup.ML_source; |
37198
3af985b10550
replaced ML_Lex.read_antiq by more concise ML_Lex.read, which includes full read/report with explicit position information;
wenzelm
parents:
37195
diff
changeset
|
282 |
val syms = Symbol_Pos.explode (txt, pos); |
37209
1c8cf0048934
terminate ML compiler input produced by ML_Lex.read (cf. 85e864045497);
wenzelm
parents:
37198
diff
changeset
|
283 |
val termination = |
1c8cf0048934
terminate ML compiler input produced by ML_Lex.read (cf. 85e864045497);
wenzelm
parents:
37198
diff
changeset
|
284 |
if null syms then [] |
1c8cf0048934
terminate ML compiler input produced by ML_Lex.read (cf. 85e864045497);
wenzelm
parents:
37198
diff
changeset
|
285 |
else |
1c8cf0048934
terminate ML compiler input produced by ML_Lex.read (cf. 85e864045497);
wenzelm
parents:
37198
diff
changeset
|
286 |
let |
1c8cf0048934
terminate ML compiler input produced by ML_Lex.read (cf. 85e864045497);
wenzelm
parents:
37198
diff
changeset
|
287 |
val pos1 = List.last syms |-> Position.advance; |
1c8cf0048934
terminate ML compiler input produced by ML_Lex.read (cf. 85e864045497);
wenzelm
parents:
37198
diff
changeset
|
288 |
val pos2 = Position.advance Symbol.space pos1; |
1c8cf0048934
terminate ML compiler input produced by ML_Lex.read (cf. 85e864045497);
wenzelm
parents:
37198
diff
changeset
|
289 |
in [Antiquote.Text (Token (Position.range pos1 pos2, (Space, Symbol.space)))] end; |
1c8cf0048934
terminate ML compiler input produced by ML_Lex.read (cf. 85e864045497);
wenzelm
parents:
37198
diff
changeset
|
290 |
val input = |
1c8cf0048934
terminate ML compiler input produced by ML_Lex.read (cf. 85e864045497);
wenzelm
parents:
37198
diff
changeset
|
291 |
(Source.of_list syms |
1c8cf0048934
terminate ML compiler input produced by ML_Lex.read (cf. 85e864045497);
wenzelm
parents:
37198
diff
changeset
|
292 |
|> Source.source Symbol_Pos.stopper (Scan.bulk (!!! "bad input" scan_antiq)) |
1c8cf0048934
terminate ML compiler input produced by ML_Lex.read (cf. 85e864045497);
wenzelm
parents:
37198
diff
changeset
|
293 |
(SOME (false, fn msg => recover msg >> map Antiquote.Text)) |
1c8cf0048934
terminate ML compiler input produced by ML_Lex.read (cf. 85e864045497);
wenzelm
parents:
37198
diff
changeset
|
294 |
|> Source.exhaust |
44736 | 295 |
|> tap (Position.reports o Antiquote.reports_of (single o report_of_token)) |
37209
1c8cf0048934
terminate ML compiler input produced by ML_Lex.read (cf. 85e864045497);
wenzelm
parents:
37198
diff
changeset
|
296 |
|> tap Antiquote.check_nesting |
40337
d25bbb5f1c9e
warn in correlation with report -- avoid spurious message duplicates;
wenzelm
parents:
40319
diff
changeset
|
297 |
|> tap (List.app (fn Antiquote.Text tok => (check_content_of tok; warn tok) | _ => ()))) |
37209
1c8cf0048934
terminate ML compiler input produced by ML_Lex.read (cf. 85e864045497);
wenzelm
parents:
37198
diff
changeset
|
298 |
handle ERROR msg => |
1c8cf0048934
terminate ML compiler input produced by ML_Lex.read (cf. 85e864045497);
wenzelm
parents:
37198
diff
changeset
|
299 |
cat_error msg ("The error(s) above occurred in ML source" ^ Position.str_of pos); |
1c8cf0048934
terminate ML compiler input produced by ML_Lex.read (cf. 85e864045497);
wenzelm
parents:
37198
diff
changeset
|
300 |
in input @ termination end; |
30645 | 301 |
|
24579 | 302 |
end; |
303 |
||
24596 | 304 |
end; |
24579 | 305 |