author | wenzelm |
Mon, 22 Jul 2019 11:39:30 +0200 | |
changeset 70393 | 9e53a98702b9 |
parent 69891 | def3ec9cdb7e |
child 73550 | 2f6855142a8c |
permissions | -rw-r--r-- |
30587
ad19c99529eb
moved Isar/antiquote.ML to General/antiquote.ML, which is loaded early;
wenzelm
parents:
30573
diff
changeset
|
1 |
(* Title: Pure/General/antiquote.ML |
55511
984e210d412e
antiquotations within plain text: Scala version in accordance to ML;
wenzelm
parents:
55107
diff
changeset
|
2 |
Author: Makarius |
9138
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
3 |
|
55511
984e210d412e
antiquotations within plain text: Scala version in accordance to ML;
wenzelm
parents:
55107
diff
changeset
|
4 |
Antiquotations within plain text. |
9138
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
5 |
*) |
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
6 |
|
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
7 |
(* Interface of the antiquotation module.  It exposes the record types for
   control-symbol and brace-style antiquotations, the 'a antiquote datatype
   (plain text, control antiquotation, or brace antiquotation), helpers for
   source ranges and line splitting, report generation, the scanners, and
   the parse/read entry points that handle formal comments. *)
signature ANTIQUOTE = |
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
8 |
sig |
61473
34d1913f0b20
clarified control antiquotations: decode control symbol to get name;
wenzelm
parents:
61471
diff
changeset
|
9 |
type control = {range: Position.range, name: string * Position.T, body: Symbol_Pos.T list} |
34d1913f0b20
clarified control antiquotations: decode control symbol to get name;
wenzelm
parents:
61471
diff
changeset
|
10 |
type antiq = {start: Position.T, stop: Position.T, range: Position.range, body: Symbol_Pos.T list} |
34d1913f0b20
clarified control antiquotations: decode control symbol to get name;
wenzelm
parents:
61471
diff
changeset
|
11 |
datatype 'a antiquote = Text of 'a | Control of control | Antiq of antiq |
61434 | 12 |
type text_antiquote = Symbol_Pos.T list antiquote |
67467 | 13 |
val text_antiquote_range: text_antiquote -> Position.range |
14 |
val text_range: text_antiquote list -> Position.range |
|
61434 | 15 |
val split_lines: text_antiquote list -> text_antiquote list list |
61457 | 16 |
val antiq_reports: 'a antiquote list -> Position.report list |
69592
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
17 |
val update_reports: bool -> Position.T -> string list -> Position.report_text list |
67426 | 18 |
val scan_control: control scanner |
19 |
val scan_antiq: antiq scanner |
|
20 |
val scan_antiquote: text_antiquote scanner |
|
67571
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
21 |
val scan_antiquote_comments: text_antiquote scanner |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
22 |
val parse_comments: Position.T -> Symbol_Pos.T list -> text_antiquote list |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
23 |
val read_comments: Input.source -> text_antiquote list |
9138
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
24 |
end; |
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
25 |
|
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
26 |
structure Antiquote: ANTIQUOTE = |
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
27 |
struct |
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
28 |
|
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
29 |
(* datatype antiquote *) |
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
30 |
|
61473
34d1913f0b20
clarified control antiquotations: decode control symbol to get name;
wenzelm
parents:
61471
diff
changeset
|
31 |
(* Data model.
   control: antiquotation introduced by a control symbol (or a bare
     cartouche); carries its overall range, its name with the position of
     that name, and the body symbols.
   antiq: brace-style antiquotation; carries the positions of the opening
     and closing delimiters (start, stop), the overall range, and the body.
   'a antiquote: either plain text of type 'a, a control antiquotation, or
     a brace-style antiquotation.
   text_antiquote: the instance whose plain text is a list of positioned
     symbols. *)
type control = {range: Position.range, name: string * Position.T, body: Symbol_Pos.T list}; |
34d1913f0b20
clarified control antiquotations: decode control symbol to get name;
wenzelm
parents:
61471
diff
changeset
|
32 |
type antiq = {start: Position.T, stop: Position.T, range: Position.range, body: Symbol_Pos.T list}; |
34d1913f0b20
clarified control antiquotations: decode control symbol to get name;
wenzelm
parents:
61471
diff
changeset
|
33 |
datatype 'a antiquote = Text of 'a | Control of control | Antiq of antiq; |
9138
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
34 |
|
61434 | 35 |
type text_antiquote = Symbol_Pos.T list antiquote; |
36 |
||
67467 | 37 |
(* Source range of a single item: for Text it is computed from the symbol
   list via Symbol_Pos.range; for Control and Antiq it is the range field
   stored in the record. *)
fun text_antiquote_range (Text ss) = Symbol_Pos.range ss |
38 |
| text_antiquote_range (Control {range, ...}) = range |
|
39 |
| text_antiquote_range (Antiq {range, ...}) = range; |
|
61450 | 40 |
|
67467 | 41 |
(* Overall range of a list of items: Position.no_range for the empty list;
   otherwise the range built from the first component of the first item's
   range and the second component of the last item's range.  The emptiness
   test guards the hd / List.last calls. *)
fun text_range ants = |
61450 | 42 |
if null ants then Position.no_range |
67467 | 43 |
else |
44 |
Position.range (#1 (text_antiquote_range (hd ants)), #2 (text_antiquote_range (List.last ants))); |
|
61450 | 45 |
|
61434 | 46 |
|
47 |
(* split lines *) |
|
48 |
||
49 |
(* Split a list of items into lines at newline symbols inside Text items.

   The fold state is (line, lines): the current line in reverse order and
   the finished lines in reverse order.
     add a   -- push item a onto the current line
     flush   -- close the current line (restoring its order) and start an
                empty one
     split   -- for Text, cut at the first "\n" symbol: the part before it
                (if non-empty) is added, the newline symbol itself is
                dropped, the line is flushed, and the remainder is split
                again; empty text is a no-op; text without newline is added
                unchanged.  Control and Antiq items are added as they are.
                NOTE(review): assumes chop_prefix returns the longest prefix
                satisfying the predicate together with the rest -- confirm
                against the library.

   Empty input yields []; otherwise a final flush closes the last line, so
   input ending in a newline produces a trailing empty line. *)
fun split_lines input = |
|
50 |
let |
|
51 |
fun add a (line, lines) = (a :: line, lines); |
|
52 |
fun flush (line, lines) = ([], rev line :: lines); |
|
53 |
fun split (a as Text ss) = |
|
67522 | 54 |
(case chop_prefix (fn ("\n", _) => false | _ => true) ss of |
61434 | 55 |
([], []) => I
56 |
| (_, []) => add a |
|
57 |
| ([], _ :: rest) => flush #> split (Text rest) |
|
58 |
| (prefix, _ :: rest) => add (Text prefix) #> flush #> split (Text rest)) |
|
59 |
| split a = add a; |
|
61440 | 60 |
in if null input then [] else rev (#2 (flush (fold split input ([], [])))) end; |
61434 | 61 |
|
27342 | 62 |
|
44736 | 63 |
(* reports *) |
30641
72980f8d7ee8
export report -- version that actually covers all cases;
wenzelm
parents:
30635
diff
changeset
|
64 |
|
61457 | 65 |
(* Markup reports for a list of items, concatenated in order:
     Text    -- no report;
     Control -- one Markup.antiquoted report at the first component of its
                range;
     Antiq   -- Markup.antiquote at the start and stop positions, plus
                Markup.antiquoted and Markup.language_antiquotation at the
                first component of its range. *)
fun antiq_reports ants = ants |> maps |
61471 | 66 |
(fn Text _ => [] |
61473
34d1913f0b20
clarified control antiquotations: decode control symbol to get name;
wenzelm
parents:
61471
diff
changeset
|
67 |
| Control {range = (pos, _), ...} => [(pos, Markup.antiquoted)] |
34d1913f0b20
clarified control antiquotations: decode control symbol to get name;
wenzelm
parents:
61471
diff
changeset
|
68 |
| Antiq {start, stop, range = (pos, _), ...} => |
61471 | 69 |
[(start, Markup.antiquote), |
70 |
(stop, Markup.antiquote), |
|
71 |
(pos, Markup.antiquoted), |
|
72 |
(pos, Markup.language_antiquotation)]); |
|
9138
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
73 |
|
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
74 |
|
69592
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
75 |
(* update *) |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
76 |
|
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
77 |
(* Produce at most one Markup.update report at pos, proposing control-symbol
   notation as replacement text.

   src is a list of strings whose head is treated as the antiquotation name.
   A report is produced only when the name is an ASCII identifier other than
   "cartouche" and either src has exactly one element, or src has exactly
   two elements and the embedded flag is set.  The replacement text is
   Symbol.control_prefix ^ name ^ Symbol.control_suffix, followed in the
   two-element case by the second element wrapped via cartouche.  In every
   other situation (including empty src) the result is []. *)
fun update_reports embedded pos src = |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
78 |
let |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
79 |
val n = length src; |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
80 |
val no_arg = n = 1; |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
81 |
val embedded_arg = n = 2 andalso embedded; |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
82 |
val control = |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
83 |
(case src of |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
84 |
name :: _ => |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
85 |
if Symbol.is_ascii_identifier name andalso name <> "cartouche" andalso |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
86 |
(no_arg orelse embedded_arg) |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
87 |
then SOME (Symbol.control_prefix ^ name ^ Symbol.control_suffix) |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
88 |
else NONE |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
89 |
| [] => NONE); |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
90 |
val arg = if embedded_arg then cartouche (nth src 1) else ""; |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
91 |
in |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
92 |
(case control of |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
93 |
SOME sym => [((pos, Markup.update), sym ^ arg)] |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
94 |
| NONE => []) |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
95 |
end; |
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
96 |
|
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
97 |
|
a80d8ec6c998
support for isabelle update -u control_cartouches;
wenzelm
parents:
67735
diff
changeset
|
98 |
|
30590
1d9c9fcf8513
parameterized datatype antiquote and read operation;
wenzelm
parents:
30589
diff
changeset
|
99 |
(* scan *) |
9138
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
100 |
|
30573 | 101 |
open Basic_Symbol_Pos; |
9138
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
102 |
|
22114 | 103 |
local |
9138
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
104 |
|
48764 | 105 |
(* Common prefix for the lexical error messages raised by the scanners in
   this local block. *)
val err_prefix = "Antiquotation lexical error: "; |
106 |
||
67193 | 107 |
(* scan_nl accepts exactly one newline symbol and returns it as a singleton
   list; scan_nl_opt does the same but yields [] when no newline follows. *)
val scan_nl = Scan.one (fn (s, _) => s = "\n") >> single; |
67571
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
108 |
val scan_nl_opt = Scan.optional scan_nl []; |
67193 | 109 |
|
67571
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
110 |
(* One chunk of plain text, tried as three alternatives in order:
     1. a non-empty run of symbols that are none of: a formal comment
        symbol, a control symbol, Symbol.open_, "@", a newline, or
        end-of-input;
     2. a single formal comment symbol, kept as ordinary text;
     3. a single "@", accepted only when the next symbol is not "{" (the
        lookahead does not consume input), so that "@{" is left for the
        antiquotation scanner. *)
val scan_plain_txt = |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
111 |
Scan.many1 (fn (s, _) => |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
112 |
not (Comment.is_symbol s) andalso |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
113 |
not (Symbol.is_control s) andalso |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
114 |
s <> Symbol.open_ andalso |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
115 |
s <> "@" andalso |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
116 |
s <> "\n" andalso |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
117 |
Symbol.not_eof s) || |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
118 |
Scan.one (Comment.is_symbol o Symbol_Pos.symbol) >> single || |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
119 |
$$$ "@" --| Scan.ahead (~$$ "{"); |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
120 |
|
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
121 |
(* One Text segment: either a lone newline, or one or more plain-text
   chunks followed by an optional newline.  A segment therefore never
   continues past a newline. *)
val scan_text = |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
122 |
scan_nl || Scan.repeats1 scan_plain_txt @@@ scan_nl_opt; |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
123 |
|
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
124 |
(* Like scan_text, but each chunk may also be a formal comment recognized by
   Comment.scan_inner (tried before plain text); only the second component
   of that scanner's result is kept as text. *)
val scan_text_comments = |
69891
def3ec9cdb7e
document markers are formal comments, and may thus occur anywhere in the command-span;
wenzelm
parents:
69592
diff
changeset
|
125 |
scan_nl || Scan.repeats1 (Comment.scan_inner >> #2 || scan_plain_txt) @@@ scan_nl_opt; |
9138
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
126 |
|
55512 | 127 |
(* One piece of the body of a brace-style antiquotation, tried in order:
     1. a double-quoted or back-quoted string; Scan.trace is used and its
        second component kept (presumably the raw symbols consumed,
        including the quotes -- confirm against Scan.trace);
     2. a cartouche;
     3. a formal comment: once Comment.scan_inner succeeds, the following
        Scan.fail under Symbol_Pos.!!! turns it into the error
        "bad formal comment in antiquote body" instead of accepting it;
     4. any single symbol other than "}" and end-of-input. *)
val scan_antiq_body = |
48764 | 128 |
Scan.trace (Symbol_Pos.scan_string_qq err_prefix || Symbol_Pos.scan_string_bq err_prefix) >> #2 || |
61481 | 129 |
Symbol_Pos.scan_cartouche err_prefix || |
69891
def3ec9cdb7e
document markers are formal comments, and may thus occur anywhere in the command-span;
wenzelm
parents:
69592
diff
changeset
|
130 |
Comment.scan_inner -- |
67735
e2e002d4a4de
clarified syntax: reject formal comments explicitly, instead of ignoring them silently;
wenzelm
parents:
67571
diff
changeset
|
131 |
Symbol_Pos.!!! (fn () => err_prefix ^ "bad formal comment in antiquote body") Scan.fail |
e2e002d4a4de
clarified syntax: reject formal comments explicitly, instead of ignoring them silently;
wenzelm
parents:
67571
diff
changeset
|
132 |
>> K [] || |
58854 | 133 |
Scan.one (fn (s, _) => s <> "}" andalso Symbol.not_eof s) >> single; |
9138
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
134 |
|
61491
97261e6c1d42
another antiquotation short form: undecorated cartouche as alias for @{text};
wenzelm
parents:
61481
diff
changeset
|
135 |
(* Name carried by a control symbol, obtained from Symbol.decode.  Only the
   Symbol.Control case is matched: the case expression is deliberately
   partial, and the scanners in this block apply it only to symbols that
   were accepted by Symbol.is_control. *)
fun control_name sym = (case Symbol.decode sym of Symbol.Control name => name); |
97261e6c1d42
another antiquotation short form: undecorated cartouche as alias for @{text};
wenzelm
parents:
61481
diff
changeset
|
136 |
|
42508
e21362bf1d93
allow nested @{antiq} (nonterminal) and @@{antiq} terminal;
wenzelm
parents:
42503
diff
changeset
|
137 |
in |
e21362bf1d93
allow nested @{antiq} (nonterminal) and @@{antiq} terminal;
wenzelm
parents:
42503
diff
changeset
|
138 |
|
61471 | 139 |
(* Scanner for control antiquotations, with two alternatives:
     1. an optional control symbol followed by a cartouche.  With a control
        symbol, the name is decoded from it and the range covers the symbol
        plus the cartouche.  Without one (bare cartouche), the name is
        "cartouche" at the position of the first body symbol and the range
        covers the cartouche alone.  The body is the scanned cartouche.
     2. a control symbol on its own: name decoded from the symbol, range of
        that single symbol, empty body. *)
val scan_control = |
61491
97261e6c1d42
another antiquotation short form: undecorated cartouche as alias for @{text};
wenzelm
parents:
61481
diff
changeset
|
140 |
Scan.option (Scan.one (Symbol.is_control o Symbol_Pos.symbol)) -- |
61481 | 141 |
Symbol_Pos.scan_cartouche err_prefix >> |
61491
97261e6c1d42
another antiquotation short form: undecorated cartouche as alias for @{text};
wenzelm
parents:
61481
diff
changeset
|
142 |
(fn (opt_control, body) => |
61473
34d1913f0b20
clarified control antiquotations: decode control symbol to get name;
wenzelm
parents:
61471
diff
changeset
|
143 |
let |
61491
97261e6c1d42
another antiquotation short form: undecorated cartouche as alias for @{text};
wenzelm
parents:
61481
diff
changeset
|
144 |
val (name, range) = |
97261e6c1d42
another antiquotation short form: undecorated cartouche as alias for @{text};
wenzelm
parents:
61481
diff
changeset
|
145 |
(case opt_control of |
97261e6c1d42
another antiquotation short form: undecorated cartouche as alias for @{text};
wenzelm
parents:
61481
diff
changeset
|
146 |
SOME (sym, pos) => ((control_name sym, pos), Symbol_Pos.range ((sym, pos) :: body)) |
97261e6c1d42
another antiquotation short form: undecorated cartouche as alias for @{text};
wenzelm
parents:
61481
diff
changeset
|
147 |
| NONE => (("cartouche", #2 (hd body)), Symbol_Pos.range body)); |
61595 | 148 |
in {name = name, range = range, body = body} end) || |
149 |
Scan.one (Symbol.is_control o Symbol_Pos.symbol) >> |
|
150 |
(fn (sym, pos) => |
|
151 |
{name = (control_name sym, pos), range = Symbol_Pos.range [(sym, pos)], body = []}); |
|
61471 | 152 |
|
9138
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
153 |
(* Scanner for brace-style antiquotations: "@" "{" body "}".

   Four positions are captured via Symbol_Pos.scan_pos: pos1 before "@",
   pos2 after "{", pos3 before "}", pos4 after "}".  The result record has
   start spanning pos1..pos2 (the opening delimiter), stop spanning
   pos3..pos4 (the closing delimiter), range spanning pos1..pos4, and body
   as the concatenated results of scan_antiq_body.

   Once "@{" has been consumed, failure of the remainder is reported through
   Symbol_Pos.!!! with the message "missing closing brace". *)
val scan_antiq = |
55526 | 154 |
Symbol_Pos.scan_pos -- ($$ "@" |-- $$ "{" |-- Symbol_Pos.scan_pos -- |
48764 | 155 |
Symbol_Pos.!!! (fn () => err_prefix ^ "missing closing brace") |
61476 | 156 |
(Scan.repeats scan_antiq_body -- Symbol_Pos.scan_pos -- ($$ "}" |-- Symbol_Pos.scan_pos))) >> |
61473
34d1913f0b20
clarified control antiquotations: decode control symbol to get name;
wenzelm
parents:
61471
diff
changeset
|
157 |
(fn (pos1, (pos2, ((body, pos3), pos4))) => |
62797 | 158 |
{start = Position.range_position (pos1, pos2), |
159 |
stop = Position.range_position (pos3, pos4), |
|
160 |
range = Position.range (pos1, pos4), |
|
61476 | 161 |
body = body}); |
30590
1d9c9fcf8513
parameterized datatype antiquote and read operation;
wenzelm
parents:
30589
diff
changeset
|
162 |
|
61471 | 163 |
(* One item of mixed text: plain text is tried first, then a control
   antiquotation, then a brace-style antiquotation; each result is wrapped
   in the matching constructor.  Formal comments are not recognized here. *)
val scan_antiquote = |
67571
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
164 |
scan_text >> Text || scan_control >> Control || scan_antiq >> Antiq; |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
165 |
|
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
166 |
(* Same alternatives as scan_antiquote, except that the text alternative is
   scan_text_comments, so formal comments are consumed as part of Text. *)
val scan_antiquote_comments = |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
167 |
scan_text_comments >> Text || scan_control >> Control || scan_antiq >> Antiq; |
9138
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
168 |
|
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
169 |
end; |
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
170 |
|
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
171 |
|
67571
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
172 |
(* parse and read (with formal comments) *) |
9138
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
173 |
|
67571
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
174 |
(* Parse positioned symbols into a list of items by repeating
   scan_antiquote_comments under Scan.read with Symbol_Pos.stopper.
   Returns the items when Scan.read yields SOME; on NONE it raises an error
   "Malformed quotation/antiquotation source" that mentions pos, which is
   used only for this message. *)
fun parse_comments pos syms = |
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
175 |
(case Scan.read Symbol_Pos.stopper (Scan.repeat scan_antiquote_comments) syms of |
62749 | 176 |
SOME ants => ants |
61456 | 177 |
| NONE => error ("Malformed quotation/antiquotation source" ^ Position.here pos)); |
178 |
||
67571
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
179 |
(* Read an Input.source: explode it into positioned symbols, parse them with
   parse_comments (using the source position for error messages), emit the
   markup reports from antiq_reports as a side effect, and return the parsed
   items. *)
fun read_comments source = |
62749 | 180 |
let |
67571
f858fe5531ac
more uniform treatment of formal comments within document source;
wenzelm
parents:
67522
diff
changeset
|
181 |
val ants = parse_comments (Input.pos_of source) (Input.source_explode source); |
62749 | 182 |
val _ = Position.reports (antiq_reports ants); |
183 |
in ants end; |
|
9138
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
184 |
|
6a4fae41a75f
Text with antiquotations of inner items (terms, types etc.).
wenzelm
parents:
diff
changeset
|
185 |
end; |