| author | wenzelm | 
| Thu, 21 Jan 2016 22:16:48 +0100 | |
| changeset 62230 | 949d2c9f6ff7 | 
| parent 61814 | 1ca1142e1711 | 
| child 62529 | 8b7bdfc09f3b | 
| permissions | -rw-r--r-- | 
| 36949 
080e85d46108
renamed structure OuterKeyword to Keyword and OuterParse to Parse, keeping the old names as legacy aliases for some time;
 wenzelm parents: 
35838diff
changeset | 1 | (* Title: Pure/Isar/parse.ML | 
| 5826 | 2 | Author: Markus Wenzel, TU Muenchen | 
| 3 | ||
| 4 | Generic parsers for Isabelle/Isar outer syntax. | |
| 5 | *) | |
| 6 | ||
| 36949 
080e85d46108
renamed structure OuterKeyword to Keyword and OuterParse to Parse, keeping the old names as legacy aliases for some time;
 wenzelm parents: 
35838diff
changeset | 7 | signature PARSE = | 
| 5826 | 8 | sig | 
| 44357 | 9 | val group: (unit -> string) -> (Token.T list -> 'a) -> Token.T list -> 'a | 
| 36959 
f5417836dbea
renamed structure OuterLex to Token and type token to Token.T, keeping legacy aliases for some time;
 wenzelm parents: 
36955diff
changeset | 10 | val !!! : (Token.T list -> 'a) -> Token.T list -> 'a | 
| 
f5417836dbea
renamed structure OuterLex to Token and type token to Token.T, keeping legacy aliases for some time;
 wenzelm parents: 
36955diff
changeset | 11 | val !!!! : (Token.T list -> 'a) -> Token.T list -> 'a | 
| 
f5417836dbea
renamed structure OuterLex to Token and type token to Token.T, keeping legacy aliases for some time;
 wenzelm parents: 
36955diff
changeset | 12 | val not_eof: Token.T parser | 
| 56201 | 13 | val token: 'a parser -> Token.T parser | 
| 59029 
c907cbe36713
more careful ML source positions, for improved PIDE markup;
 wenzelm parents: 
58908diff
changeset | 14 |   val range: 'a parser -> ('a * Position.range) parser
 | 
| 42326 | 15 |   val position: 'a parser -> ('a * Position.T) parser
 | 
| 59809 | 16 | val input: 'a parser -> Input.source parser | 
| 42326 | 17 | val inner_syntax: 'a parser -> string parser | 
| 58908 | 18 | val command_: string parser | 
| 29310 | 19 | val keyword: string parser | 
| 20 | val short_ident: string parser | |
| 21 | val long_ident: string parser | |
| 22 | val sym_ident: string parser | |
| 60629 | 23 | val dots: string parser | 
| 29310 | 24 | val minus: string parser | 
| 25 | val term_var: string parser | |
| 26 | val type_ident: string parser | |
| 27 | val type_var: string parser | |
| 28 | val number: string parser | |
| 40290 
47f572aff50a
support for floating-point tokens in outer syntax (coinciding with inner syntax version);
 wenzelm parents: 
36959diff
changeset | 29 | val float_number: string parser | 
| 29310 | 30 | val string: string parser | 
| 31 | val alt_string: string parser | |
| 32 | val verbatim: string parser | |
| 55033 | 33 | val cartouche: string parser | 
| 29310 | 34 | val eof: string parser | 
| 58908 | 35 | val command: string -> string parser | 
| 29310 | 36 | val keyword_with: (string -> bool) -> string parser | 
| 56202 | 37 | val keyword_markup: bool * Markup.T -> string -> string parser | 
| 38 | val keyword_improper: string -> string parser | |
| 29310 | 39 | val $$$ : string -> string parser | 
| 40 | val reserved: string -> string parser | |
| 41 | val underscore: string parser | |
| 42 | val maybe: 'a parser -> 'a option parser | |
| 43 | val tag_name: string parser | |
| 44 | val tags: string list parser | |
| 45 | val opt_keyword: string -> bool parser | |
| 59917 
9830c944670f
more uniform "verbose" option to print name space;
 wenzelm parents: 
59809diff
changeset | 46 | val opt_bang: bool parser | 
| 29310 | 47 | val begin: string parser | 
| 48 | val opt_begin: bool parser | |
| 49 | val nat: int parser | |
| 50 | val int: int parser | |
| 40290 
47f572aff50a
support for floating-point tokens in outer syntax (coinciding with inner syntax version);
 wenzelm parents: 
36959diff
changeset | 51 | val real: real parser | 
| 55764 | 52 |   val enum_positions: string -> 'a parser -> ('a list * Position.T list) parser
 | 
| 53 |   val enum1_positions: string -> 'a parser -> ('a list * Position.T list) parser
 | |
| 29310 | 54 | val enum: string -> 'a parser -> 'a list parser | 
| 55 | val enum1: string -> 'a parser -> 'a list parser | |
| 56 | val and_list: 'a parser -> 'a list parser | |
| 57 | val and_list1: 'a parser -> 'a list parser | |
| 30511 | 58 | val enum': string -> 'a context_parser -> 'a list context_parser | 
| 59 | val enum1': string -> 'a context_parser -> 'a list context_parser | |
| 60 | val and_list': 'a context_parser -> 'a list context_parser | |
| 61 | val and_list1': 'a context_parser -> 'a list context_parser | |
| 29310 | 62 | val list: 'a parser -> 'a list parser | 
| 63 | val list1: 'a parser -> 'a list parser | |
| 43775 
b361c7d184e7
added Parse.properties (again) -- allow empty list like Parse_Value.properties but unlike Parse.properties of ef86de9c98aa;
 wenzelm parents: 
42657diff
changeset | 64 | val properties: Properties.T parser | 
| 29310 | 65 | val name: bstring parser | 
| 29581 | 66 | val binding: binding parser | 
| 29310 | 67 | val xname: xstring parser | 
| 68 | val text: string parser | |
| 48881 
46e053eda5dd
clarified Parse.path vs. Parse.explode -- prefer errors in proper transaction context;
 wenzelm parents: 
46922diff
changeset | 69 | val path: string parser | 
| 59693 | 70 | val theory_name: bstring parser | 
| 71 | val theory_xname: xstring parser | |
| 40800 
330eb65c9469
Parse.liberal_name for document antiquotations and attributes;
 wenzelm parents: 
40793diff
changeset | 72 | val liberal_name: xstring parser | 
| 29310 | 73 | val parname: string parser | 
| 29581 | 74 | val parbinding: binding parser | 
| 46922 
3717f3878714
source positions for locale and class expressions;
 wenzelm parents: 
45596diff
changeset | 75 | val class: string parser | 
| 29310 | 76 | val sort: string parser | 
| 46922 
3717f3878714
source positions for locale and class expressions;
 wenzelm parents: 
45596diff
changeset | 77 | val type_const: string parser | 
| 29310 | 78 | val arity: (string * string list * string) parser | 
| 79 | val multi_arity: (string list * string list * string) parser | |
| 80 | val type_args: string list parser | |
| 35838 | 81 | val type_args_constrained: (string * string option) list parser | 
| 29310 | 82 | val typ_group: string parser | 
| 83 | val typ: string parser | |
| 84 | val mixfix: mixfix parser | |
| 85 | val mixfix': mixfix parser | |
| 86 | val opt_mixfix: mixfix parser | |
| 87 | val opt_mixfix': mixfix parser | |
| 88 | val where_: string parser | |
| 42299 | 89 | val const_decl: (string * string * mixfix) parser | 
| 30339 | 90 | val const_binding: (binding * string * mixfix) parser | 
| 60448 | 91 | val params: (binding * string option * mixfix) list parser | 
| 29581 | 92 | val fixes: (binding * string option * mixfix) list parser | 
| 93 | val for_fixes: (binding * string option * mixfix) list parser | |
| 59064 | 94 | val ML_source: Input.source parser | 
| 95 | val document_source: Input.source parser | |
| 29310 | 96 | val term_group: string parser | 
| 97 | val prop_group: string parser | |
| 98 | val term: string parser | |
| 99 | val prop: string parser | |
| 42300 
0d1cbc1fe579
notation: proper markup for type constructor / constant;
 wenzelm parents: 
42299diff
changeset | 100 | val const: string parser | 
| 40793 
d21aedaa91e7
added Parse.literal_fact with proper inner_syntax markup (source position);
 wenzelm parents: 
40296diff
changeset | 101 | val literal_fact: string parser | 
| 29310 | 102 | val propp: (string * string list) parser | 
| 103 | val termp: (string * string list) parser | |
| 59924 
801b979ec0c2
more general notion of command span: command keyword not necessarily at start;
 wenzelm parents: 
59918diff
changeset | 104 | val private: Position.T parser | 
| 59990 
a81dc82ecba3
clarified keyword 'qualified' in accordance to a similar keyword from Haskell (despite unrelated Binding.qualified in Isabelle/ML);
 wenzelm parents: 
59939diff
changeset | 105 | val qualified: Position.T parser | 
| 45488 
6d71d9e52369
pass positions for named targets, for formal links in the document model;
 wenzelm parents: 
45331diff
changeset | 106 | val target: (xstring * Position.T) parser | 
| 
6d71d9e52369
pass positions for named targets, for formal links in the document model;
 wenzelm parents: 
45331diff
changeset | 107 | val opt_target: (xstring * Position.T) option parser | 
| 56201 | 108 | val args: Token.T list parser | 
| 109 | val args1: (string -> bool) -> Token.T list parser | |
| 58028 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 110 | val attribs: Token.src list parser | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 111 | val opt_attribs: Token.src list parser | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 112 | val thm_sel: Facts.interval list parser | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 113 | val xthm: (Facts.ref * Token.src list) parser | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 114 | val xthms1: (Facts.ref * Token.src list) list parser | 
| 5826 | 115 | end; | 
| 116 | ||
| 36949 
080e85d46108
renamed structure OuterKeyword to Keyword and OuterParse to Parse, keeping the old names as legacy aliases for some time;
 wenzelm parents: 
35838diff
changeset | 117 | structure Parse: PARSE = | 
| 5826 | 118 | struct | 
| 119 | ||
| 120 | (** error handling **) | |
| 121 | ||
| 122 | (* group atomic parsers (no cuts!) *) | |
| 123 | ||
| 44357 | 124 | fun group s scan = scan || Scan.fail_with | 
| 48911 
5debc3e4fa81
tuned messages: end-of-input rarely means physical end-of-file from the past;
 wenzelm parents: 
48881diff
changeset | 125 | (fn [] => (fn () => s () ^ " expected,\nbut end-of-input was found") | 
| 42519 | 126 | | tok :: _ => | 
| 43947 
9b00f09f7721
defer evaluation of Scan.message, for improved performance in the frequent situation where failure is handled later (e.g. via ||);
 wenzelm parents: 
43775diff
changeset | 127 | (fn () => | 
| 
9b00f09f7721
defer evaluation of Scan.message, for improved performance in the frequent situation where failure is handled later (e.g. via ||);
 wenzelm parents: 
43775diff
changeset | 128 | (case Token.text_of tok of | 
| 
9b00f09f7721
defer evaluation of Scan.message, for improved performance in the frequent situation where failure is handled later (e.g. via ||);
 wenzelm parents: 
43775diff
changeset | 129 | (txt, "") => | 
| 55708 | 130 | s () ^ " expected,\nbut " ^ txt ^ Position.here (Token.pos_of tok) ^ | 
| 131 | " was found" | |
| 43947 
9b00f09f7721
defer evaluation of Scan.message, for improved performance in the frequent situation where failure is handled later (e.g. via ||);
 wenzelm parents: 
43775diff
changeset | 132 | | (txt1, txt2) => | 
| 55708 | 133 | s () ^ " expected,\nbut " ^ txt1 ^ Position.here (Token.pos_of tok) ^ | 
| 134 | " was found:\n" ^ txt2))); | |
| 5826 | 135 | |
| 136 | ||
| 5877 | 137 | (* cut *) | 
| 5826 | 138 | |
| 8581 
5c7ed2af8bfb
!!!! = cut "Corrupted outer syntax in presentation";
 wenzelm parents: 
8350diff
changeset | 139 | fun cut kind scan = | 
| 5826 | 140 | let | 
| 48911 
5debc3e4fa81
tuned messages: end-of-input rarely means physical end-of-file from the past;
 wenzelm parents: 
48881diff
changeset | 141 | fun get_pos [] = " (end-of-input)" | 
| 55708 | 142 | | get_pos (tok :: _) = Position.here (Token.pos_of tok); | 
| 5826 | 143 | |
| 43947 
9b00f09f7721
defer evaluation of Scan.message, for improved performance in the frequent situation where failure is handled later (e.g. via ||);
 wenzelm parents: 
43775diff
changeset | 144 | fun err (toks, NONE) = (fn () => kind ^ get_pos toks) | 
| 25625 | 145 | | err (toks, SOME msg) = | 
| 43947 
9b00f09f7721
defer evaluation of Scan.message, for improved performance in the frequent situation where failure is handled later (e.g. via ||);
 wenzelm parents: 
43775diff
changeset | 146 | (fn () => | 
| 
9b00f09f7721
defer evaluation of Scan.message, for improved performance in the frequent situation where failure is handled later (e.g. via ||);
 wenzelm parents: 
43775diff
changeset | 147 | let val s = msg () in | 
| 
9b00f09f7721
defer evaluation of Scan.message, for improved performance in the frequent situation where failure is handled later (e.g. via ||);
 wenzelm parents: 
43775diff
changeset | 148 | if String.isPrefix kind s then s | 
| 
9b00f09f7721
defer evaluation of Scan.message, for improved performance in the frequent situation where failure is handled later (e.g. via ||);
 wenzelm parents: 
43775diff
changeset | 149 | else kind ^ get_pos toks ^ ": " ^ s | 
| 
9b00f09f7721
defer evaluation of Scan.message, for improved performance in the frequent situation where failure is handled later (e.g. via ||);
 wenzelm parents: 
43775diff
changeset | 150 | end); | 
| 5826 | 151 | in Scan.!! err scan end; | 
| 152 | ||
| 8586 | 153 | fun !!! scan = cut "Outer syntax error" scan; | 
| 154 | fun !!!! scan = cut "Corrupted outer syntax in presentation" scan; | |
| 8581 
5c7ed2af8bfb
!!!! = cut "Corrupted outer syntax in presentation";
 wenzelm parents: 
8350diff
changeset | 155 | |
| 5826 | 156 | |
| 157 | ||
| 158 | (** basic parsers **) | |
| 159 | ||
| 160 | (* tokens *) | |
| 161 | ||
| 27815 | 162 | fun RESET_VALUE atom = (*required for all primitive parsers*) | 
| 36959 
f5417836dbea
renamed structure OuterLex to Token and type token to Token.T, keeping legacy aliases for some time;
 wenzelm parents: 
36955diff
changeset | 163 | Scan.ahead (Scan.one (K true)) -- atom >> (fn (arg, x) => (Token.assign NONE arg; x)); | 
| 27815 | 164 | |
| 165 | ||
| 36959 
f5417836dbea
renamed structure OuterLex to Token and type token to Token.T, keeping legacy aliases for some time;
 wenzelm parents: 
36955diff
changeset | 166 | val not_eof = RESET_VALUE (Scan.one Token.not_eof); | 
| 15703 | 167 | |
| 56201 | 168 | fun token atom = Scan.ahead not_eof --| atom; | 
| 169 | ||
| 59029 
c907cbe36713
more careful ML source positions, for improved PIDE markup;
 wenzelm parents: 
58908diff
changeset | 170 | fun range scan = (Scan.ahead not_eof >> (Token.range_of o single)) -- scan >> Library.swap; | 
| 55708 | 171 | fun position scan = (Scan.ahead not_eof >> Token.pos_of) -- scan >> Library.swap; | 
| 59809 | 172 | fun input atom = Scan.ahead atom |-- not_eof >> Token.input_of; | 
| 55111 | 173 | fun inner_syntax atom = Scan.ahead atom |-- not_eof >> Token.inner_syntax_of; | 
| 5826 | 174 | |
| 175 | fun kind k = | |
| 44357 | 176 | group (fn () => Token.str_of_kind k) | 
| 177 | (RESET_VALUE (Scan.one (Token.is_kind k) >> Token.content_of)); | |
| 5826 | 178 | |
| 58908 | 179 | val command_ = kind Token.Command; | 
| 36959 
f5417836dbea
renamed structure OuterLex to Token and type token to Token.T, keeping legacy aliases for some time;
 wenzelm parents: 
36955diff
changeset | 180 | val keyword = kind Token.Keyword; | 
| 
f5417836dbea
renamed structure OuterLex to Token and type token to Token.T, keeping legacy aliases for some time;
 wenzelm parents: 
36955diff
changeset | 181 | val short_ident = kind Token.Ident; | 
| 59081 | 182 | val long_ident = kind Token.Long_Ident; | 
| 183 | val sym_ident = kind Token.Sym_Ident; | |
| 36959 
f5417836dbea
renamed structure OuterLex to Token and type token to Token.T, keeping legacy aliases for some time;
 wenzelm parents: 
36955diff
changeset | 184 | val term_var = kind Token.Var; | 
| 59081 | 185 | val type_ident = kind Token.Type_Ident; | 
| 186 | val type_var = kind Token.Type_Var; | |
| 36959 
f5417836dbea
renamed structure OuterLex to Token and type token to Token.T, keeping legacy aliases for some time;
 wenzelm parents: 
36955diff
changeset | 187 | val number = kind Token.Nat; | 
| 40290 
47f572aff50a
support for floating-point tokens in outer syntax (coinciding with inner syntax version);
 wenzelm parents: 
36959diff
changeset | 188 | val float_number = kind Token.Float; | 
| 36959 
f5417836dbea
renamed structure OuterLex to Token and type token to Token.T, keeping legacy aliases for some time;
 wenzelm parents: 
36955diff
changeset | 189 | val string = kind Token.String; | 
| 59081 | 190 | val alt_string = kind Token.Alt_String; | 
| 36959 
f5417836dbea
renamed structure OuterLex to Token and type token to Token.T, keeping legacy aliases for some time;
 wenzelm parents: 
36955diff
changeset | 191 | val verbatim = kind Token.Verbatim; | 
| 55033 | 192 | val cartouche = kind Token.Cartouche; | 
| 36959 
f5417836dbea
renamed structure OuterLex to Token and type token to Token.T, keeping legacy aliases for some time;
 wenzelm parents: 
36955diff
changeset | 193 | val eof = kind Token.EOF; | 
| 5826 | 194 | |
| 58908 | 195 | fun command x = | 
| 48927 
ef462b5558eb
theory def/ref position reports, which enable hyperlinks etc.;
 wenzelm parents: 
48911diff
changeset | 196 | group (fn () => Token.str_of_kind Token.Command ^ " " ^ quote x) | 
| 
ef462b5558eb
theory def/ref position reports, which enable hyperlinks etc.;
 wenzelm parents: 
48911diff
changeset | 197 | (RESET_VALUE (Scan.one (fn tok => Token.is_command tok andalso Token.content_of tok = x))) | 
| 
ef462b5558eb
theory def/ref position reports, which enable hyperlinks etc.;
 wenzelm parents: 
48911diff
changeset | 198 | >> Token.content_of; | 
| 
ef462b5558eb
theory def/ref position reports, which enable hyperlinks etc.;
 wenzelm parents: 
48911diff
changeset | 199 | |
| 56202 | 200 | fun keyword_with pred = RESET_VALUE (Scan.one (Token.keyword_with pred) >> Token.content_of); | 
| 201 | ||
| 202 | fun keyword_markup markup x = | |
| 44357 | 203 | group (fn () => Token.str_of_kind Token.Keyword ^ " " ^ quote x) | 
| 56063 | 204 | (Scan.ahead not_eof -- keyword_with (fn y => x = y)) | 
| 56202 | 205 | >> (fn (tok, x) => (Token.assign (SOME (Token.Literal markup)) tok; x)); | 
| 206 | ||
| 207 | val keyword_improper = keyword_markup (true, Markup.improper); | |
| 208 | val $$$ = keyword_markup (false, Markup.quasi_keyword); | |
| 9131 | 209 | |
| 16030 | 210 | fun reserved x = | 
| 44357 | 211 | group (fn () => "reserved identifier " ^ quote x) | 
| 36959 
f5417836dbea
renamed structure OuterLex to Token and type token to Token.T, keeping legacy aliases for some time;
 wenzelm parents: 
36955diff
changeset | 212 | (RESET_VALUE (Scan.one (Token.ident_with (fn y => x = y)) >> Token.content_of)); | 
| 16030 | 213 | |
| 60629 | 214 | val dots = sym_ident :-- (fn "\\<dots>" => Scan.succeed () | _ => Scan.fail) >> #1; | 
| 215 | ||
| 15703 | 216 | val minus = sym_ident :-- (fn "-" => Scan.succeed () | _ => Scan.fail) >> #1; | 
| 60629 | 217 | |
| 11792 
311eee3d63b6
parser for underscore (actually a symbolic identifier!);
 wenzelm parents: 
11651diff
changeset | 218 | val underscore = sym_ident :-- (fn "_" => Scan.succeed () | _ => Scan.fail) >> #1; | 
| 15703 | 219 | fun maybe scan = underscore >> K NONE || scan >> SOME; | 
| 11792 
311eee3d63b6
parser for underscore (actually a symbolic identifier!);
 wenzelm parents: 
11651diff
changeset | 220 | |
| 14835 | 221 | val nat = number >> (#1 o Library.read_int o Symbol.explode); | 
| 27815 | 222 | val int = Scan.optional (minus >> K ~1) 1 -- nat >> op *; | 
| 51988 | 223 | val real = float_number >> Markup.parse_real || int >> Real.fromInt; | 
| 5826 | 224 | |
| 44357 | 225 | val tag_name = group (fn () => "tag name") (short_ident || string); | 
| 17070 | 226 | val tags = Scan.repeat ($$$ "%" |-- !!! tag_name); | 
| 227 | ||
| 14646 | 228 | fun opt_keyword s = Scan.optional ($$$ "(" |-- !!! (($$$ s >> K true) --| $$$ ")")) false;
 | 
| 59917 
9830c944670f
more uniform "verbose" option to print name space;
 wenzelm parents: 
59809diff
changeset | 229 | val opt_bang = Scan.optional ($$$ "!" >> K true) false; | 
| 14646 | 230 | |
| 20983 | 231 | val begin = $$$ "begin"; | 
| 232 | val opt_begin = Scan.optional (begin >> K true) false; | |
| 20961 | 233 | |
| 5826 | 234 | |
| 235 | (* enumerations *) | |
| 236 | ||
| 55764 | 237 | fun enum1_positions sep scan = | 
| 238 | scan -- Scan.repeat (position ($$$ sep) -- !!! scan) >> | |
| 239 | (fn (x, ys) => (x :: map #2 ys, map (#2 o #1) ys)); | |
| 240 | fun enum_positions sep scan = | |
| 241 | enum1_positions sep scan || Scan.succeed ([], []); | |
| 242 | ||
| 25999 | 243 | fun enum1 sep scan = scan ::: Scan.repeat ($$$ sep |-- !!! scan); | 
| 5826 | 244 | fun enum sep scan = enum1 sep scan || Scan.succeed []; | 
| 245 | ||
| 27815 | 246 | fun enum1' sep scan = scan ::: Scan.repeat (Scan.lift ($$$ sep) |-- scan); | 
| 247 | fun enum' sep scan = enum1' sep scan || Scan.succeed []; | |
| 5826 | 248 | |
| 6013 | 249 | fun and_list1 scan = enum1 "and" scan; | 
| 250 | fun and_list scan = enum "and" scan; | |
| 251 | ||
| 27815 | 252 | fun and_list1' scan = enum1' "and" scan; | 
| 253 | fun and_list' scan = enum' "and" scan; | |
| 254 | ||
| 255 | fun list1 scan = enum1 "," scan; | |
| 256 | fun list scan = enum "," scan; | |
| 257 | ||
| 43775 
b361c7d184e7
added Parse.properties (again) -- allow empty list like Parse_Value.properties but unlike Parse.properties of ef86de9c98aa;
 wenzelm parents: 
42657diff
changeset | 258 | val properties = $$$ "(" |-- !!! (list (string -- ($$$ "=" |-- string)) --| $$$ ")");
 | 
| 
b361c7d184e7
added Parse.properties (again) -- allow empty list like Parse_Value.properties but unlike Parse.properties of ef86de9c98aa;
 wenzelm parents: 
42657diff
changeset | 259 | |
| 5826 | 260 | |
| 5960 | 261 | (* names and text *) | 
| 5826 | 262 | |
| 44357 | 263 | val name = group (fn () => "name declaration") (short_ident || sym_ident || string || number); | 
| 264 | ||
| 30223 
24d975352879
renamed Binding.name_pos to Binding.make, renamed Binding.base_name to Binding.name_of, renamed Binding.map_base to Binding.map_name, added mandatory flag to Binding.qualify;
 wenzelm parents: 
29581diff
changeset | 265 | val binding = position name >> Binding.make; | 
| 44357 | 266 | |
| 267 | val xname = group (fn () => "name reference") | |
| 268 | (short_ident || long_ident || sym_ident || string || number); | |
| 269 | ||
| 270 | val text = group (fn () => "text") | |
| 56499 
7e0178c84994
allow text cartouches in regular outer syntax categories "text" and "altstring";
 wenzelm parents: 
56202diff
changeset | 271 | (short_ident || long_ident || sym_ident || string || number || verbatim || cartouche); | 
| 44357 | 272 | |
| 48881 
46e053eda5dd
clarified Parse.path vs. Parse.explode -- prefer errors in proper transaction context;
 wenzelm parents: 
46922diff
changeset | 273 | val path = group (fn () => "file name/path specification") name; | 
| 6553 | 274 | |
| 59693 | 275 | val theory_name = group (fn () => "theory name") name; | 
| 276 | val theory_xname = group (fn () => "theory name reference") xname; | |
| 277 | ||
| 56063 | 278 | val liberal_name = keyword_with Token.ident_or_symbolic || xname; | 
| 40800 
330eb65c9469
Parse.liberal_name for document antiquotations and attributes;
 wenzelm parents: 
40793diff
changeset | 279 | |
| 18898 | 280 | val parname = Scan.optional ($$$ "(" |-- name --| $$$ ")") "";
 | 
| 28965 | 281 | val parbinding = Scan.optional ($$$ "(" |-- binding --| $$$ ")") Binding.empty;
 | 
| 18898 | 282 | |
| 6553 | 283 | |
| 46922 
3717f3878714
source positions for locale and class expressions;
 wenzelm parents: 
45596diff
changeset | 284 | (* type classes *) | 
| 
3717f3878714
source positions for locale and class expressions;
 wenzelm parents: 
45596diff
changeset | 285 | |
| 
3717f3878714
source positions for locale and class expressions;
 wenzelm parents: 
45596diff
changeset | 286 | val class = group (fn () => "type class") (inner_syntax xname); | 
| 5826 | 287 | |
| 44357 | 288 | val sort = group (fn () => "sort") (inner_syntax xname); | 
| 5826 | 289 | |
| 46922 
3717f3878714
source positions for locale and class expressions;
 wenzelm parents: 
45596diff
changeset | 290 | val type_const = inner_syntax (group (fn () => "type constructor") xname); | 
| 
3717f3878714
source positions for locale and class expressions;
 wenzelm parents: 
45596diff
changeset | 291 | |
| 
3717f3878714
source positions for locale and class expressions;
 wenzelm parents: 
45596diff
changeset | 292 | val arity = type_const -- ($$$ "::" |-- !!! | 
| 61466 | 293 |   (Scan.optional ($$$ "(" |-- !!! (list1 sort --| $$$ ")")) [] -- sort)) >> Scan.triple2;
 | 
| 5826 | 294 | |
| 46922 
3717f3878714
source positions for locale and class expressions;
 wenzelm parents: 
45596diff
changeset | 295 | val multi_arity = and_list1 type_const -- ($$$ "::" |-- !!! | 
| 61466 | 296 |   (Scan.optional ($$$ "(" |-- !!! (list1 sort --| $$$ ")")) [] -- sort)) >> Scan.triple2;
 | 
| 25541 | 297 | |
| 5826 | 298 | |
| 299 | (* types *) | |
| 300 | ||
| 44357 | 301 | val typ_group = | 
| 302 | group (fn () => "type") | |
| 303 | (short_ident || long_ident || sym_ident || type_ident || type_var || string || number); | |
| 5826 | 304 | |
| 27753 
94b672153b49
sort/typ/term/prop: inner_syntax markup encodes original source position;
 wenzelm parents: 
27737diff
changeset | 305 | val typ = inner_syntax typ_group; | 
| 
94b672153b49
sort/typ/term/prop: inner_syntax markup encodes original source position;
 wenzelm parents: 
27737diff
changeset | 306 | |
| 35838 | 307 | fun type_arguments arg = | 
| 308 | arg >> single || | |
| 309 |   $$$ "(" |-- !!! (list1 arg --| $$$ ")") ||
 | |
| 5826 | 310 | Scan.succeed []; | 
| 311 | ||
| 35838 | 312 | val type_args = type_arguments type_ident; | 
| 313 | val type_args_constrained = type_arguments (type_ident -- Scan.option ($$$ "::" |-- !!! sort)); | |
| 314 | ||
| 5826 | 315 | |
| 316 | (* mixfix annotations *) | |
| 317 | ||
| 51654 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 wenzelm parents: 
51627diff
changeset | 318 | local | 
| 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 wenzelm parents: 
51627diff
changeset | 319 | |
| 18669 | 320 | val mfix = string -- | 
| 321 | !!! (Scan.optional ($$$ "[" |-- !!! (list nat --| $$$ "]")) [] -- | |
| 61466 | 322 | Scan.optional nat 1000) >> (Mixfix o Scan.triple2); | 
| 18669 | 323 | |
| 35130 | 324 | val infx = $$$ "infix" |-- !!! (string -- nat >> Infix); | 
| 325 | val infxl = $$$ "infixl" |-- !!! (string -- nat >> Infixl); | |
| 326 | val infxr = $$$ "infixr" |-- !!! (string -- nat >> Infixr); | |
| 51654 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 wenzelm parents: 
51627diff
changeset | 327 | val strcture = $$$ "structure" >> K Structure; | 
| 5826 | 328 | |
| 18669 | 329 | val binder = $$$ "binder" |-- | 
| 330 | !!! (string -- ($$$ "[" |-- nat --| $$$ "]" -- nat || nat >> (fn n => (n, n)))) | |
| 61466 | 331 | >> (Binder o Scan.triple2); | 
| 18669 | 332 | |
| 51654 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 wenzelm parents: 
51627diff
changeset | 333 | val mixfix_body = mfix || strcture || binder || infxl || infxr || infx; | 
| 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 wenzelm parents: 
51627diff
changeset | 334 | |
| 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 wenzelm parents: 
51627diff
changeset | 335 | fun annotation guard body = $$$ "(" |-- guard (body --| $$$ ")");
 | 
| 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 wenzelm parents: 
51627diff
changeset | 336 | fun opt_annotation guard body = Scan.optional (annotation guard body) NoSyn; | 
| 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 wenzelm parents: 
51627diff
changeset | 337 | |
| 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 wenzelm parents: 
51627diff
changeset | 338 | in | 
| 18669 | 339 | |
| 51654 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 wenzelm parents: 
51627diff
changeset | 340 | val mixfix = annotation !!! mixfix_body; | 
| 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 wenzelm parents: 
51627diff
changeset | 341 | val mixfix' = annotation I mixfix_body; | 
| 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 wenzelm parents: 
51627diff
changeset | 342 | val opt_mixfix = opt_annotation !!! mixfix_body; | 
| 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 wenzelm parents: 
51627diff
changeset | 343 | val opt_mixfix' = opt_annotation I mixfix_body; | 
| 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 wenzelm parents: 
51627diff
changeset | 344 | |
| 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 wenzelm parents: 
51627diff
changeset | 345 | end; | 
| 5826 | 346 | |
| 347 | ||
| 18669 | 348 | (* fixes *) | 
| 5826 | 349 | |
| 21400 | 350 | val where_ = $$$ "where"; | 
| 351 | ||
| 61466 | 352 | val const_decl = name -- ($$$ "::" |-- !!! typ) -- opt_mixfix >> Scan.triple1; | 
| 353 | val const_binding = binding -- ($$$ "::" |-- !!! typ) -- opt_mixfix >> Scan.triple1; | |
| 18669 | 354 | |
| 61466 | 355 | val param_mixfix = binding -- Scan.option ($$$ "::" |-- typ) -- mixfix' >> (single o Scan.triple1); | 
| 60448 | 356 | val params = | 
| 357 | Scan.repeat1 binding -- Scan.option ($$$ "::" |-- !!! typ) | |
| 358 | >> (fn (xs, T) => map (fn x => (x, T, NoSyn)) xs); | |
| 18669 | 359 | |
| 60448 | 360 | val fixes = and_list1 (param_mixfix || params) >> flat; | 
| 19845 | 361 | val for_fixes = Scan.optional ($$$ "for" |-- !!! fixes) []; | 
| 362 | ||
| 5826 | 363 | |
| 27877 | 364 | (* embedded source text *) | 
| 27872 
631371a02b8c
P.doc_source and P.ml_sorce for proper SymbolPos.text;
 wenzelm parents: 
27815diff
changeset | 365 | |
| 59809 | 366 | val ML_source = input (group (fn () => "ML source") text); | 
| 367 | val document_source = input (group (fn () => "document source") text); | |
| 27872 
631371a02b8c
P.doc_source and P.ml_sorce for proper SymbolPos.text;
 wenzelm parents: 
27815diff
changeset | 368 | |
| 
631371a02b8c
P.doc_source and P.ml_sorce for proper SymbolPos.text;
 wenzelm parents: 
27815diff
changeset | 369 | |
| 5826 | 370 | (* terms *) | 
| 371 | ||
| 40793 
d21aedaa91e7
added Parse.literal_fact with proper inner_syntax markup (source position);
 wenzelm parents: 
40296diff
changeset | 372 | val tm = short_ident || long_ident || sym_ident || term_var || number || string; | 
| 5826 | 373 | |
| 44357 | 374 | val term_group = group (fn () => "term") tm; | 
| 375 | val prop_group = group (fn () => "proposition") tm; | |
| 27753 
94b672153b49
sort/typ/term/prop: inner_syntax markup encodes original source position;
 wenzelm parents: 
27737diff
changeset | 376 | |
| 
94b672153b49
sort/typ/term/prop: inner_syntax markup encodes original source position;
 wenzelm parents: 
27737diff
changeset | 377 | val term = inner_syntax term_group; | 
| 
94b672153b49
sort/typ/term/prop: inner_syntax markup encodes original source position;
 wenzelm parents: 
27737diff
changeset | 378 | val prop = inner_syntax prop_group; | 
| 5826 | 379 | |
| 44357 | 380 | val const = inner_syntax (group (fn () => "constant") xname); | 
| 42300 
0d1cbc1fe579
notation: proper markup for type constructor / constant;
 wenzelm parents: 
42299diff
changeset | 381 | |
| 56499 
7e0178c84994
allow text cartouches in regular outer syntax categories "text" and "altstring";
 wenzelm parents: 
56202diff
changeset | 382 | val literal_fact = inner_syntax (group (fn () => "literal fact") (alt_string || cartouche)); | 
| 40793 
d21aedaa91e7
added Parse.literal_fact with proper inner_syntax markup (source position);
 wenzelm parents: 
40296diff
changeset | 383 | |
| 5826 | 384 | |
| 6949 | 385 | (* patterns *) | 
| 6935 | 386 | |
| 6949 | 387 | val is_terms = Scan.repeat1 ($$$ "is" |-- term); | 
| 6935 | 388 | val is_props = Scan.repeat1 ($$$ "is" |-- prop); | 
| 389 | ||
| 19585 | 390 | val propp = prop -- Scan.optional ($$$ "(" |-- !!! (is_props --| $$$ ")")) [];
 | 
| 6949 | 391 | val termp = term -- Scan.optional ($$$ "(" |-- !!! (is_terms --| $$$ ")")) [];
 | 
| 6935 | 392 | |
| 393 | ||
| 59924 
801b979ec0c2
more general notion of command span: command keyword not necessarily at start;
 wenzelm parents: 
59918diff
changeset | 394 | (* target information *) | 
| 
801b979ec0c2
more general notion of command span: command keyword not necessarily at start;
 wenzelm parents: 
59918diff
changeset | 395 | |
| 
801b979ec0c2
more general notion of command span: command keyword not necessarily at start;
 wenzelm parents: 
59918diff
changeset | 396 | val private = position ($$$ "private") >> #2; | 
| 59990 
a81dc82ecba3
clarified keyword 'qualified' in accordance to a similar keyword from Haskell (despite unrelated Binding.qualified in Isabelle/ML);
 wenzelm parents: 
59939diff
changeset | 397 | val qualified = position ($$$ "qualified") >> #2; | 
| 19811 | 398 | |
| 45488 
6d71d9e52369
pass positions for named targets, for formal links in the document model;
 wenzelm parents: 
45331diff
changeset | 399 | val target = ($$$ "(" -- $$$ "in") |-- !!! (position xname --| $$$ ")");
 | 
| 22119 | 400 | val opt_target = Scan.option target; | 
| 12272 | 401 | |
| 56201 | 402 | |
| 403 | (* arguments within outer syntax *) | |
| 404 | ||
| 405 | local | |
| 406 | ||
| 407 | val argument_kinds = | |
| 59081 | 408 | [Token.Ident, Token.Long_Ident, Token.Sym_Ident, Token.Var, Token.Type_Ident, Token.Type_Var, | 
| 409 | Token.Nat, Token.Float, Token.String, Token.Alt_String, Token.Cartouche, Token.Verbatim]; | |
| 56201 | 410 | |
| 411 | fun arguments is_symid = | |
| 412 | let | |
| 413 | fun argument blk = | |
| 414 | group (fn () => "argument") | |
| 415 | (Scan.one (fn tok => | |
| 416 | let val kind = Token.kind_of tok in | |
| 417 | member (op =) argument_kinds kind orelse | |
| 418 | Token.keyword_with is_symid tok orelse | |
| 419 | (blk andalso Token.keyword_with (fn s => s = ",") tok) | |
| 420 | end)); | |
| 421 | ||
| 422 | fun args blk x = Scan.optional (args1 blk) [] x | |
| 423 | and args1 blk x = | |
| 61476 | 424 |       (Scan.repeats1 (Scan.repeat1 (argument blk) || argsp "(" ")" || argsp "[" "]")) x
 | 
| 56201 | 425 | and argsp l r x = (token ($$$ l) ::: !!! (args true @@@ (token ($$$ r) >> single))) x; | 
| 426 | in (args, args1) end; | |
| 427 | ||
| 428 | in | |
| 429 | ||
| 430 | val args = #1 (arguments Token.ident_or_symbolic) false; | |
| 431 | fun args1 is_symid = #2 (arguments is_symid) false; | |
| 432 | ||
| 433 | end; | |
| 434 | ||
| 58028 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 435 | |
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 436 | (* attributes *) | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 437 | |
| 61814 
1ca1142e1711
clarified type Token.src: plain token list, with usual implicit value assignment;
 wenzelm parents: 
61476diff
changeset | 438 | val attrib = token liberal_name ::: !!! args; | 
| 58028 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 439 | val attribs = $$$ "[" |-- list attrib --| $$$ "]"; | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 440 | val opt_attribs = Scan.optional attribs []; | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 441 | |
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 442 | |
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 443 | (* theorem references *) | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 444 | |
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 445 | val thm_sel = $$$ "(" |-- list1
 | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 446 | (nat --| minus -- nat >> Facts.FromTo || | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 447 | nat --| minus >> Facts.From || | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 448 | nat >> Facts.Single) --| $$$ ")"; | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 449 | |
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 450 | val xthm = | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 451 | $$$ "[" |-- attribs --| $$$ "]" >> pair (Facts.named "") || | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 452 | (literal_fact >> Facts.Fact || | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 453 | position xname -- Scan.option thm_sel >> Facts.Named) -- opt_attribs; | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 454 | |
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 455 | val xthms1 = Scan.repeat1 xthm; | 
| 
e4250d370657
tuned signature -- define some elementary operations earlier;
 wenzelm parents: 
58011diff
changeset | 456 | |
| 12272 | 457 | end; |