1 (* Title: Pure/Thy/thy_parse.ML
3 Author: Markus Wenzel, TU Muenchen
5 The parser for theory files.
8 infix 5 -- --$$ $$-- ^^;
(*commit to a parser: a SYNTAX_ERROR it raises is reported as an error
  instead of being passed on to an enclosing ||*)
15 val !! : ('a -> 'b * 'c) -> 'a -> 'b * 'c
(*apply a function to the result of a parser*)
16 val >> : ('a -> 'b * 'c) * ('b -> 'd) -> 'a -> 'd * 'c
(*alternative: the second parser is tried on the same input if the first
  one raises SYNTAX_ERROR*)
17 val || : ('a -> 'b) * ('a -> 'b) -> 'a -> 'b
(*sequence: the second parser continues where the first one stopped; both
  results are paired*)
18 val -- : ('a -> 'b * 'c) * ('c -> 'd * 'e) -> 'a -> ('b * 'd) * 'e
(*sequence of two string parsers whose results are concatenated*)
19 val ^^ : ('a -> string * 'b) * ('b -> string * 'c) -> 'a -> string * 'c
(*accept exactly the given keyword*)
20 val $$ : string -> token list -> string * token list
(*keyword followed by a parser; only the result of the parser is kept*)
21 val $$-- : string * (token list -> 'b * 'c) -> token list -> 'b * 'c
(*parser followed by a keyword; only the result of the parser is kept*)
22 val --$$ : ('a -> 'b * token list) * string -> 'a -> 'b * token list
(*parsers for a single token of one kind, returning the text of the token;
  long_id accepts an ident or a long_ident, type_var returns quoted text*)
23 val ident: token list -> string * token list
24 val long_ident: token list -> string * token list
25 val long_id: token list -> string * token list
26 val type_var: token list -> string * token list
(*NOTE(review): the definitions of type_args and nat are not fully visible
  in this listing; presumably a group of type variables and a Nat token*)
27 val type_args: token list -> string list * token list
28 val nat: token list -> string * token list
29 val string: token list -> string * token list
30 val verbatim: token list -> string * token list
(*consume nothing and return the empty list*)
31 val empty: 'a -> 'b list * 'a
(*result of the parser, or the given default if it raises SYNTAX_ERROR*)
32 val optional: ('a -> 'b * 'a) -> 'b -> 'a -> 'b * 'a
(*zero or more / one or more repetitions of a parser*)
33 val repeat: ('a -> 'b * 'a) -> 'a -> 'b list * 'a
34 val repeat1: ('a -> 'b * 'a) -> 'a -> 'b list * 'a
(*items separated by the given keyword; enum also accepts no item at all,
  enum1 requires at least one*)
35 val enum: string -> (token list -> 'a * token list)
36 -> token list -> 'a list * token list
37 val enum1: string -> (token list -> 'a * token list)
38 -> token list -> 'a list * token list
(*list1 is enum1 with a comma as separator; the definition of list is not
  visible in this listing (presumably enum with a comma)*)
39 val list: (token list -> 'a * token list)
40 -> token list -> 'a list * token list
41 val list1: (token list -> 'a * token list)
42 -> token list -> 'a list * token list
(*an identifier (returned in quoted form) or a string token*)
43 val name: token list -> string * token list
44 val sort: token list -> string * token list
(*optional annotation in parentheses; without one the result is NoSyn*)
45 val opt_infix: token list -> string * token list
46 val opt_mixfix: token list -> string * token list
47 val opt_witness: token list -> string * token list
(*build a syntax from additional keywords and a list of named section
  parsers; duplicate section names are an error*)
49 val make_syntax: string list ->
50 (string * (token list -> (string * string) * token list)) list -> syntax
(*parse_thy syntax tname str: tokenize str and parse it as the definition
  of theory tname, returning the generated text*)
51 val parse_thy: syntax -> string -> string -> string
(*section name pretxt parse: named section parser made from parse, with no
  axiom names attached*)
52 val section: string -> string -> (token list -> string * token list)
53 -> (string * (token list -> (string * string) * token list))
(*axm_section name pretxt parse: named section parser; parse also yields a
  list of axiom names, for each of which a get_axiom binding is generated*)
54 val axm_section: string -> string
55 -> (token list -> (string * string list) * token list)
56 -> (string * (token list -> (string * string) * token list))
57 val pure_keywords: string list
(*NOTE(review): the next line is the type of a specification whose head is
  not visible in this listing (presumably pure_sections)*)
59 (string * (token list -> (string * string) * token list)) list
60 (*items for building strings*)
(*join two strings with a blank*)
61 val cat: string -> string -> string
62 val parens: string -> string
63 val brackets: string -> string
64 val mk_list: string list -> string
65 val mk_big_list: string list -> string
66 val mk_pair: string * string -> string
67 val mk_triple: string * string * string -> string
(*remove the first and the last character of a string*)
68 val strip_quotes: string -> string
71 functor ThyParseFun(structure Symtab: SYMTAB and ThyScan: THY_SCAN): THY_PARSE =
77 (** parser toolbox **)
(*A token: its kind, its text and the number of the line it was found on.*)
type token = token_kind * string * int;

(*Parse failure carrying (expected, found, line number). It is handled by ||
  in order to try an alternative, and turned into an error message by !!.*)
exception SYNTAX_ERROR of string * string * int;

(*Raise SYNTAX_ERROR from curried arguments.*)
fun syn_err expected found line = raise SYNTAX_ERROR (expected, found, line);

(*Running out of tokens is reported through error, not as a SYNTAX_ERROR.*)
fun eof_err () = error "Unexpected end-of-file";
(*Commit to a parser, in the manner of Prolog's cut: a SYNTAX_ERROR raised
  by parse is converted into an error message right here, so that an
  enclosing || gets no chance to backtrack over it.*)
fun !! parse toks =
  parse toks handle SYNTAX_ERROR (expected, found, line) =>
    let
      val position = "Syntax error on line " ^ string_of_int line;
      val detail = expected ^ " expected and " ^ found ^ " was found";
    in error (position ^ ": " ^ detail) end;
97 (* parser combinators *)
(*parse >> f: run parse and apply f to its result; the remaining input is
  handed on unchanged*)
fun (parse >> f) toks =
  let val (x, rest) = parse toks
  in (f x, rest) end;
(*first || second: try first; if it raises SYNTAX_ERROR, run second on the
  very same input instead*)
fun (first || second) toks =
  (first toks) handle SYNTAX_ERROR _ => second toks;
(*parse1 -- parse2: sequential composition; parse1 consumes a prefix of toks
  and parse2 continues on the tokens that parse1 left over.
  NOTE(review): the lines that frame these bindings and build the result
  are not visible in this listing.*)
104 fun (parse1 -- parse2) toks =
106 val (x, toks') = parse1 toks;
107 val (y, toks'') = parse2 toks';
(*parse1 ^^ parse2: run two string parsers in sequence and concatenate
  their results*)
fun (parse1 ^^ parse2) toks =
  ((parse1 -- parse2) >> (fn (s1, s2) => s1 ^ s2)) toks;
115 (* generic parsers *)
(*$$ a: accept the keyword a and return it with the remaining tokens. Any
  other leading token is a SYNTAX_ERROR at the line of that token; empty
  input is an end-of-file error.*)
fun $$ _ [] = eof_err ()
  | $$ a ((k, b, n) :: toks) =
      if k <> Keyword orelse a <> b then syn_err (quote a) (quote b) n
      else (a, toks);
(*a $$-- parse: keyword a followed by parse; only the result of parse is kept*)
fun (a $$-- parse) toks = (($$ a -- parse) >> (fn (_, x) => x)) toks;

(*parse --$$ a: parse followed by keyword a; only the result of parse is kept*)
fun (parse --$$ a) toks = ((parse -- $$ a) >> (fn (x, _) => x)) toks;
(*kind k1: accept one token of kind k1 and return its text. A token of any
  other kind is a SYNTAX_ERROR naming the expected kind; empty input is an
  end-of-file error.*)
fun kind _ [] = eof_err ()
  | kind k1 ((k2, s, n) :: toks) =
      if k1 <> k2 then syn_err (name_of_kind k1) (quote s) n
      else (s, toks);
(*single-token parsers, one for each kind of token*)
fun ident toks = kind Ident toks;
fun long_ident toks = kind LongIdent toks;

(*either form of identifier; the short form is tried first*)
fun long_id toks = (ident || long_ident) toks;

(*the text of a type variable is returned in quoted form*)
fun type_var toks = (kind TypeVar >> quote) toks;

fun string toks = kind String toks;
fun verbatim toks = kind Verbatim toks;
(*parser that consumes nothing and yields the empty list*)
fun empty rest = (nil, rest);
(*optional parse def: the result of parse if it succeeds; if parse raises
  SYNTAX_ERROR, the default def is returned and no input is consumed*)
fun optional parse def toks =
  parse toks handle SYNTAX_ERROR _ => (def, toks);
(*repeat parse: apply parse until it raises SYNTAX_ERROR (possibly at once)
  and collect the results in order*)
fun repeat parse toks =
  let
    fun cons (x, xs) = x :: xs;
    val one_more = parse -- repeat parse >> cons;
  in (one_more || empty) toks end;

(*repeat1 parse: like repeat, but parse has to succeed at least once*)
fun repeat1 parse toks =
  (parse -- repeat parse >> (fn (x, xs) => x :: xs)) toks;
(*enum1 sep parse: one or more items recognized by parse, separated by the
  keyword sep*)
fun enum1 sep parse toks =
  let val more = repeat (sep $$-- parse)
  in (parse -- more >> (fn (x, xs) => x :: xs)) toks end;

(*enum sep parse: like enum1, but the enumeration may also be empty*)
fun enum sep parse toks = (enum1 sep parse || empty) toks;

(*non-empty enumeration separated by commas*)
fun list1 parse toks = enum1 "," parse toks;
155 (** theory parsers **)
(*cat left right: join two strings with a single blank in between*)
fun cat left right = left ^ (" " ^ right);
(*enclose a string in round / square brackets*)
fun parens str = enclose "(" ")" str;
fun brackets str = enclose "[" "]" str;

(*text of a list: the items combined by commas, in square brackets*)
fun mk_list items = brackets (commas items);

(*the same, with a comma and a line break between the items*)
fun mk_big_list items = brackets (space_implode ",\n " items);

(*text of a pair and of a triple*)
fun mk_pair (a, b) = parens (commas [a, b]);
fun mk_triple (a, b, c) = parens (commas [a, b, c]);

(*mk_triple for arguments nested to the left / to the right*)
fun mk_triple1 ((a, b), c) = mk_triple (a, b, c);
fun mk_triple2 (a, (b, c)) = mk_triple (a, b, c);
(*split_decls: distribute the second component over the items of the first,
  i.e. every (xs, y) contributes one entry per element of xs; all entries
  are returned as one flat list*)
fun split_decls decls =
  let fun distribute (xs, y) = map (rpair y) xs
  in flat (map distribute decls) end;
(*strip_quotes str: str without its first and its last character*)
fun strip_quotes str =
  let
    val chars = explode str;
    val without_last = take (size str - 1, chars);
  in implode (tl without_last) end;
(*a name is an identifier (returned in quoted form) or a string token*)
fun name toks = (ident >> quote || string) toks;

(*names separated by commas; names1 demands at least one*)
fun names toks = list name toks;
fun names1 toks = list1 name toks;

(*the same, rendered as text by mk_list*)
fun name_list toks = (names >> mk_list) toks;
fun name_list1 toks = (names1 >> mk_list) toks;
(*a class name, optionally followed by the keyword < and a non-empty list
  of names; without that part the text of the empty list is used*)
fun subclass toks =
  (name -- optional ("<" $$-- !! name_list1) "[]") toks;

(*one or more class declarations, each rendered as a pair*)
fun class_decls toks =
  (repeat1 (subclass >> mk_pair) >> mk_big_list) toks;
198 "{" $$-- name_list --$$ "}";
(*non-empty list of sorts separated by commas, rendered by mk_list*)
fun sort_list1 toks = (list1 sort >> mk_list) toks;

(*arity: optional list of argument sorts in parentheses (default: text of
  the empty list), followed by the result sort*)
fun arity toks =
  (optional ("(" $$-- !! (sort_list1 --$$ ")")) "[]" -- sort) toks;

(*one or more declarations of the form  names :: arity;  every name yields
  its own triple*)
fun arity_decls toks =
  (repeat1 (names1 --$$ "::" -- !! arity)
    >> (fn decls => mk_big_list (map mk_triple2 (split_decls decls)))) toks;
209 (* mixfix annotations *)
(*infix annotations: the keyword must be followed by a nat token*)
fun infxl toks = ("infixl" $$-- !! nat >> (fn pri => cat "Infixl" pri)) toks;
fun infxr toks = ("infixr" $$-- !! nat >> (fn pri => cat "Infixr" pri)) toks;
(*binder annotation: the keyword binder, a string, and then either a nat in
  square brackets followed by a second nat, or a single nat that is used in
  both positions; the result is Binder followed by the text of the triple.
  NOTE(review): one closing line of this definition is not visible in this
  listing.*)
214 val binder = "binder" $$--
215 !! (string -- ( ("[" $$-- nat --$$ "]") -- nat
216 || nat >> (fn n => (n,n))
218 >> (cat "Binder" o mk_triple2);
(*optional list of nats in square brackets, rendered by mk_list; the empty
  list if absent*)
fun opt_pris toks =
  (optional ("[" $$-- !! (list nat --$$ "]")) [] >> mk_list) toks;

(*mixfix annotation: a string, optional bracketed nats and an optional nat
  that defaults to max_pri*)
fun mixfix toks =
  (string -- !! (opt_pris -- optional nat "max_pri")
    >> (fn annot => cat "Mixfix" (mk_triple2 annot))) toks;
(*opt_syn fx: annotation fx in parentheses; NoSyn if there is none*)
fun opt_syn fx toks = optional ("(" $$-- fx --$$ ")") "NoSyn" toks;

(*optional infix annotation only / any of the annotation forms*)
fun opt_infix toks = opt_syn (infxl || infxr) toks;
fun opt_mixfix toks = opt_syn (mixfix || infxl || infxr || binder) toks;
(*old-style declaration: every name in ts gets the same n and syn; all
  entries are tagged false*)
fun mk_old_type_decl ((ts, n), syn) =
  let fun decl t = (mk_triple (t, n, syn), false)
  in map decl ts end;

(*new-style declaration: without right-hand side an entry tagged false that
  records the number of arguments; with right-hand side an entry tagged
  true that records the arguments and the right-hand side*)
fun mk_type_decl (((xs, t), rhs_opt), syn) =
  (case rhs_opt of
    None => [(mk_triple (t, string_of_int (length xs), syn), false)]
  | Some rhs => [(parens (commas [t, mk_list xs, rhs, syn]), true)]);

(*text for all declarations: entries tagged false go to add_types, entries
  tagged true go to add_tyabbrs*)
fun mk_type_decls tys =
  let
    val types = mk_big_list (keyfilter tys false);
    val abbrs = mk_big_list (keyfilter tys true);
  in "|> add_types\n" ^ types ^ "\n\n|> add_tyabbrs\n" ^ abbrs end;
(*old-style type declaration: names, a nat and an optional infix annotation*)
fun old_type_decl toks =
  (names1 -- nat -- opt_infix >> mk_old_type_decl) toks;
249 type_var >> (fn x => [x]) ||
250 "(" $$-- !! (list1 type_var --$$ ")") ||
(*type declaration: type arguments, a name, an optional right-hand side
  (the keyword = followed by a string) and an optional infix annotation*)
fun type_decl toks =
  (type_args -- name -- optional ("=" $$-- !! string >> Some) None
    -- opt_infix >> mk_type_decl) toks;

(*one or more type declarations; the old form is tried first*)
fun type_decls toks =
  (repeat1 (old_type_decl || type_decl)
    >> (fn decls => mk_type_decls (flat decls))) toks;
(*one or more declarations of the form  names :: string  with an optional
  annotation; every name yields its own triple*)
fun const_decls toks =
  (repeat1 (names1 --$$ "::" -- !! (string -- opt_mixfix))
    >> (fn decls => mk_big_list (map mk_triple2 (split_decls decls)))) toks;
268 optional ("(" $$-- !! (name --$$ ")")) "\"logic\"" -- string >> mk_pair;
271 $$ "=>" >> K " |-> " ||
272 $$ "<=" >> K " <-| " ||
273 $$ "==" >> K " <-> ";
(*one or more translation rules: pattern, arrow and pattern, concatenated
  into a single string; once the first pattern has been read, the arrow and
  the second pattern are mandatory.
  NOTE(review): the continuation of this definition is not visible in this
  listing.*)
275 val trans_decls = repeat1 (trans_pat ^^ !! (trans_arrow ^^ trans_pat))
279 (* ML translations *)
282 " val parse_ast_translation = [];\n\
283 \ val parse_translation = [];\n\
284 \ val print_translation = [];\n\
285 \ val print_ast_translation = [];";
288 "(parse_ast_translation, parse_translation, \
289 \print_translation, print_ast_translation)";
296 \ " ^ trfun_args ^ "\n\
(*ML translations: a verbatim token, processed by mk_mltrans*)
fun mltrans toks = (verbatim >> mk_mltrans) toks;
(*text of a list of axioms: one pair per axiom, with the name quoted*)
fun mk_axms axms =
  let fun axm_pair (id, txt) = mk_pair (quote id, txt)
  in mk_big_list (map axm_pair axms) end;

(*text of the axioms together with the plain list of their names*)
fun mk_axiom_decls axms = (mk_axms axms, map (fn (id, _) => id) axms);

(*one or more axioms: an identifier followed by a mandatory string*)
fun axiom_decls toks =
  (repeat1 (ident -- !! string) >> mk_axiom_decls) toks;
(*text of an axiomatic class: the class pair, a line break and the axioms.
  The names returned are the class name without its first and last
  character, with I appended, followed by the names of the axioms.*)
fun mk_axclass_decl ((c, cs), axms) =
  let
    val txt = mk_pair (c, cs) ^ "\n" ^ mk_axms axms;
    val intro = strip_quotes c ^ "I";
  in (txt, intro :: map fst axms) end;

(*a class with optional superclasses, followed by any number of axioms*)
fun axclass_decl toks =
  (subclass -- repeat (ident -- !! string) >> mk_axclass_decl) toks;
(*text of a witness: the entries of axths selected by keyfilter with false
  and those selected with true, each as a list, on separate lines.
  NOTE(review): the end of this definition, where opt_tac is presumably
  used, is not visible in this listing.*)
322 fun mk_witness (axths, opt_tac) =
323 mk_list (keyfilter axths false) ^ "\n" ^
324 mk_list (keyfilter axths true) ^ "\n" ^
328 string >> rpair false ||
329 long_id >> rpair true;
333 optional ("(" $$-- list1 axm_or_thm --$$ ")") [] --
334 optional (verbatim >> (parens o cat "Some" o parens)) "None"
338 (name --$$ "<" -- name >> (pair "|> AxClass.add_inst_subclass" o mk_pair) ||
339 name --$$ "::" -- arity >> (pair "|> AxClass.add_inst_arity" o mk_triple2))
341 >> (fn ((x, y), z) => (cat_lines [x, y, z]));
345 (** theory syntax **)
348 lexicon * (token list -> (string * string) * token list) Symtab.table;
(*make_syntax keywords sects: the lexicon covers the section names and the
  given keywords; the section parsers are stored in a table indexed by
  name. Section names that occur twice are reported as an error.*)
fun make_syntax keywords sects =
  let
    val lex = make_lexicon (map fst sects @ keywords);
    val sectab = Symtab.make sects
      handle Symtab.DUPS dups =>
        error ("Duplicate sections in theory file syntax: " ^ commas_quote dups);
  in (lex, sectab) end;
(*header result: the theory name and the text of a mk_base call on the
  list of bases and the quoted theory name*)
fun mk_header (thy_name, bases) =
  let val base_txt = "mk_base " ^ mk_list bases ^ " " ^ quote thy_name
  in (thy_name, base_txt) end;
362 ident >> (cat "Thy" o quote) ||
363 string >> cat "File";
(*theory header: an identifier, the keyword = and one or more bases that
  are separated by +*)
fun header toks = (ident --$$ "=" -- enum1 "+" base >> mk_header) toks;
(*mk_extension (txts, mltxt): txts is a list of pairs of section texts. The
  first and the second components are collected separately; within each
  collection empty texts are dropped and the remaining ones are joined with
  a blank line in between. mltxt is passed through as third component.
  NOTE(review): the lines that frame the local bindings are not visible in
  this listing.*)
370 fun mk_extension (txts, mltxt) =
372 val cat_sects = space_implode "\n\n" o filter_out (equal "");
373 val (extxts, postxts) = split_list txts;
375 (cat_sects extxts, cat_sects postxts, mltxt)
(*sect tab: parse one section. The leading token has to be a keyword that
  is present in tab; its parser is then run on the rest of the input and
  committed to by means of !!. Any other leading token is a SYNTAX_ERROR,
  empty input is an end-of-file error.*)
fun sect _ [] = eof_err ()
  | sect tab ((Keyword, s, n) :: toks) =
      (case Symtab.lookup (tab, s) of
        None => syn_err "section" s n
      | Some parse => !! parse toks)
  | sect _ ((_, s, n) :: _) = syn_err "section" s n;
(*theory extension: the keyword +, any number of sections and the keyword
  end, optionally followed by the keyword ML and a verbatim text (the empty
  string if absent)*)
fun extension sectab toks =
  let
    val sections = "+" $$-- !! (repeat (sect sectab) --$$ "end");
    val ml_text = optional ("ML" $$-- verbatim) "";
  in (sections -- ml_text >> mk_extension) toks end;
389 (* theory definition *)
(*mk_structure tname ((thy_name, old_thys), opt_txts): generate the ML text
  for a theory. It is an error if the theory name from the header differs
  from tname, the name derived from the file name. The visible lines show
  two variants of the generated text, one for a theory with an extension
  (Some) and one without; both bind thy, open a structure named after the
  theory and call store_theory.
  NOTE(review): most lines of the generated text and of the case analysis
  are not visible in this listing.*)
391 fun mk_structure tname ((thy_name, old_thys), opt_txts) =
392 if thy_name <> tname then
393 error ("Filename \"" ^ tname ^ ".thy\" and theory name "
394 ^ quote thy_name ^ " are different")
397 Some (extxt, postxt, mltxt) =>
398 "val thy = " ^ old_thys ^ " true;\n\n\
399 \structure " ^ thy_name ^ " =\n\
415 \|> add_thyname " ^ quote thy_name ^ ";\n\
417 \val _ = store_theory (thy, " ^ quote thy_name ^ ");\n\
425 "val thy = " ^ old_thys ^ " false;\n\
427 \structure " ^ thy_name ^ " =\n\
432 \val _ = store_theory (thy, " ^ quote thy_name ^ ");\n\
(*theory definition: a header, an optional extension and the end of the
  input; the result of eof is discarded and the remainder is passed to
  mk_structure*)
fun theory_defn sectab tname toks =
  (header -- optional (extension sectab >> Some) None -- eof
    >> (fn (defn, _) => mk_structure tname defn)) toks;
(*parse_thy (lex, sectab) tname str: tokenize str with the lexicon lex and
  parse the tokens as the definition of theory tname; syntax errors are
  reported through !!. Only the generated text is returned.*)
fun parse_thy (lex, sectab) tname str =
  let
    val toks = tokenize lex str;
    val (txt, _) = !! (theory_defn sectab tname) toks;
  in txt end;
444 (* standard sections *)
(*text of an ML binding that fetches the axiom ax from thy under its own
  name*)
fun mk_val ax =
  let val lhs = "val " ^ ax and rhs = "get_axiom thy " ^ quote ax
  in lhs ^ " = " ^ rhs ^ ";" end;

(*one such binding per axiom name, combined by cat_lines*)
fun mk_vals axs = cat_lines (map mk_val axs);
(*mk_axm_sect pretxt (txt, axs): the section text, preceded by pretxt and a
  line break unless pretxt is empty, paired with the bindings for the
  axiom names axs*)
fun mk_axm_sect pretxt (txt, axs) =
  let val extxt = if pretxt = "" then txt else pretxt ^ "\n" ^ txt
  in (extxt, mk_vals axs) end;
(*axm_section name pretxt parse: section called name whose parser yields a
  text and a list of axiom names, post-processed by mk_axm_sect*)
fun axm_section name pretxt parse =
  let val sect_parser = parse >> mk_axm_sect pretxt
  in (name, sect_parser) end;

(*section name pretxt parse: the same for a parser that yields a text only;
  the list of axiom names is empty*)
fun section name pretxt parse =
  let val without_axioms = parse >> rpair []
  in axm_section name pretxt without_axioms end;
460 ["end", "ML", "mixfix", "infixr", "infixl", "binder", "=", "+", ",", "<",
461 "{", "}", "(", ")", "[", "]", "::", "==", "=>", "<="];
464 [section "classes" "|> add_classes" class_decls,
465 section "default" "|> add_defsort" sort,
466 section "types" "" type_decls,
467 section "arities" "|> add_arities" arity_decls,
468 section "consts" "|> add_consts" const_decls,
469 section "syntax" "|> add_syntax" const_decls,
470 section "translations" "|> add_trrules" trans_decls,
471 section "MLtrans" "|> add_trfuns" mltrans,
472 section "MLtext" "" verbatim,
473 axm_section "rules" "|> add_axioms" axiom_decls,
474 axm_section "defs" "|> add_defs" axiom_decls,
475 axm_section "axclass" "|> AxClass.add_axclass" axclass_decl,
476 section "instance" "" instance_decl];