(*  Title:      Pure/Syntax/syntax.ML
    ID:         $Id$
    Author:     Tobias Nipkow and Markus Wenzel, TU Muenchen

Root of Isabelle's syntax module.
*)

infix |-> <-| <->;

(*basic interface: selected parts of the component signatures plus the
  external representation of translation rules*)
signature BASIC_SYNTAX =
sig
  include AST0
  include SYN_TRANS0
  include MIXFIX0
  include PRINTER0
  datatype xrule =
      op |-> of (string * string) * (string * string)
    | op <-| of (string * string) * (string * string)
    | op <-> of (string * string) * (string * string)
end;

(*full interface of the syntax module*)
signature SYNTAX =
sig
  include AST1
  include LEXICON0
  include SYN_EXT0
  include TYPE_EXT0
  include SYN_TRANS1
  include MIXFIX1
  include PRINTER0
  sharing type ast = Parser.SynExt.Ast.ast
  datatype xrule =
      op |-> of (string * string) * (string * string)
    | op <-| of (string * string) * (string * string)
    | op <-> of (string * string) * (string * string)
  type syntax
  val extend_log_types: syntax -> string list -> syntax
  val extend_type_gram: syntax -> (string * int * mixfix) list -> syntax
  val extend_const_gram: syntax -> (string * typ * mixfix) list -> syntax
  val extend_consts: syntax -> string list -> syntax
  val extend_trfuns: syntax ->
    (string * (ast list -> ast)) list *
    (string * (term list -> term)) list *
    (string * (term list -> term)) list *
    (string * (ast list -> ast)) list -> syntax
  val extend_trrules: syntax -> xrule list -> syntax
  val merge_syntaxes: syntax -> syntax -> syntax
  val type_syn: syntax
  val print_gram: syntax -> unit
  val print_trans: syntax -> unit
  val print_syntax: syntax -> unit
  val test_read: syntax -> string -> string -> unit
  val read: syntax -> typ -> string -> term
  val read_typ: syntax -> (indexname -> sort) -> string -> typ
  val simple_read_typ: string -> typ
  val pretty_term: syntax -> term -> Pretty.T
  val pretty_typ: syntax -> typ -> Pretty.T
  val string_of_term: syntax -> term -> string
  val string_of_typ: syntax -> typ -> string
  val simple_string_of_typ: typ -> string
  val simple_pprint_typ: typ -> pprint_args -> unit
end;

functor SyntaxFun(structure Symtab: SYMTAB and TypeExt: TYPE_EXT
  and SynTrans: SYN_TRANS and Mixfix: MIXFIX and Printer: PRINTER
  sharing Mixfix.SynExt = SynTrans.Parser.SynExt = TypeExt.SynExt = Printer.SynExt)
  : SYNTAX =
struct

structure SynExt = TypeExt.SynExt;
structure Parser = SynTrans.Parser;
structure Lexicon = Parser.Lexicon;
open Lexicon SynExt SynExt.Ast Parser TypeExt SynTrans Mixfix Printer;


(** translation function tables **)

(*every entry pairs a translation function with a unit ref; the ref
  acts as the unique identity of that entry*)
type 'a trtab = (('a list -> 'a) * unit ref) Symtab.table;

(*list the entries of a table*)
fun dest_trtab tab = Symtab.dest tab;

(*find the translation function registered for c (without its id)*)
fun lookup_trtab tab c =
  (case Symtab.lookup (tab, c) of
    None => None
  | Some (f, _) => Some f);


(* trtabs: empty, extend, merge *)

(*report names that have more than one translation of kind 'name'*)
fun err_dup_trfuns name cs =
  error ("More than one " ^ name ^ " for " ^ commas_quote cs);

val empty_trtab = Symtab.null;

(*add new translation functions, each tagged with a fresh id;
  Symtab.DUPS is turned into a user error*)
fun extend_trtab tab trfuns name =
  let
    fun stamp (c, f) = (c, (f, ref ()));
  in
    Symtab.extend_new (tab, map stamp trfuns)
      handle Symtab.DUPS dups => err_dup_trfuns name dups
  end;

(*merge two tables, comparing entries with eq_snd;
  Symtab.DUPS is turned into a user error*)
fun merge_trtabs tab1 tab2 name =
  Symtab.merge eq_snd (tab1, tab2)
    handle Symtab.DUPS dups => err_dup_trfuns name dups;



(** translation rule tables **)

type ruletab = (ast * ast) list Symtab.table;

(*all rules of a table as one flat list*)
fun dest_ruletab tab =
  flat (map (fn (_, rules) => rules) (Symtab.dest tab));


(* lookup_ruletab *)

(*None for an empty table, otherwise a function yielding the rules
  stored under a given key*)
fun lookup_ruletab tab =
  if Symtab.is_null tab then None
  else Some (fn a => Symtab.lookup_multi (tab, a));


(* ruletabs: empty, extend, merge *)

val empty_ruletab = Symtab.null;

(*add the distinct rules, each keyed by head_of_rule*)
fun extend_ruletab tab rules =
  let
    fun keyed rule = (head_of_rule rule, rule);
  in
    generic_extend (op =) Symtab.dest_multi Symtab.make_multi tab
      (map keyed (distinct rules))
  end;

fun merge_ruletabs tab1 tab2 =
  generic_merge (op =) Symtab.dest_multi Symtab.make_multi tab1 tab2;



(** datatype syntax **)

datatype syntax =
  Syntax of {
    lexicon: lexicon,
    roots: string list,
    gram: gram,
    consts: string list,
    parse_ast_trtab: ast trtab,
    parse_ruletab: ruletab,
    parse_trtab: term trtab,
    print_trtab: term trtab,
    print_ruletab: ruletab,
    print_ast_trtab: ast trtab,
    prtab: prtab};


(* empty_syntax *)

(*syntax in which every component is the respective empty value*)
val empty_syntax =
  Syntax {
    lexicon = empty_lexicon,
    roots = [],
    gram = empty_gram,
    consts = [],
    parse_ast_trtab = empty_trtab,
    parse_ruletab = empty_ruletab,
    parse_trtab = empty_trtab,
    print_trtab = empty_trtab,
    print_ruletab = empty_ruletab,
    print_ast_trtab = empty_trtab,
    prtab = empty_prtab};


(* extend_syntax *)

(*extend each component of a syntax by the matching part of a syntax
  extension; the components are computed in the order written below*)
fun extend_syntax
    (Syntax {lexicon, roots = old_roots, gram, consts = old_consts,
      parse_ast_trtab, parse_ruletab, parse_trtab, print_trtab,
      print_ruletab, print_ast_trtab, prtab})
    (SynExt {roots = new_roots, xprods, consts = new_consts,
      parse_ast_translation, parse_rules, parse_translation,
      print_translation, print_rules, print_ast_translation}) =
  Syntax {
    lexicon = extend_lexicon lexicon (delims_of xprods),
    roots = extend_list old_roots new_roots,
    gram = extend_gram gram xprods,
    consts = new_consts union old_consts,
    parse_ast_trtab =
      extend_trtab parse_ast_trtab parse_ast_translation "parse ast translation",
    parse_ruletab = extend_ruletab parse_ruletab parse_rules,
    parse_trtab = extend_trtab parse_trtab parse_translation "parse translation",
    print_trtab = extend_trtab print_trtab print_translation "print translation",
    print_ruletab = extend_ruletab print_ruletab print_rules,
    print_ast_trtab =
      extend_trtab print_ast_trtab print_ast_translation "print ast translation",
    prtab = extend_prtab prtab xprods};


(* merge_syntaxes *)

(*merge two syntaxes component by component; the components are
  computed in the order written below*)
fun merge_syntaxes
    (Syntax {lexicon = lexicon1, roots = roots1, gram = gram1, consts = consts1,
      parse_ast_trtab = parse_ast_trtab1, parse_ruletab = parse_ruletab1,
      parse_trtab = parse_trtab1, print_trtab = print_trtab1,
      print_ruletab = print_ruletab1, print_ast_trtab = print_ast_trtab1,
      prtab = prtab1})
    (Syntax {lexicon = lexicon2, roots = roots2, gram = gram2, consts = consts2,
      parse_ast_trtab = parse_ast_trtab2, parse_ruletab = parse_ruletab2,
      parse_trtab = parse_trtab2, print_trtab = print_trtab2,
      print_ruletab = print_ruletab2, print_ast_trtab = print_ast_trtab2,
      prtab = prtab2}) =
  Syntax {
    lexicon = merge_lexicons lexicon1 lexicon2,
    roots = merge_lists roots1 roots2,
    gram = merge_grams gram1 gram2,
    consts = merge_lists consts1 consts2,
    parse_ast_trtab =
      merge_trtabs parse_ast_trtab1 parse_ast_trtab2 "parse ast translation",
    parse_ruletab = merge_ruletabs parse_ruletab1 parse_ruletab2,
    parse_trtab = merge_trtabs parse_trtab1 parse_trtab2 "parse translation",
    print_trtab = merge_trtabs print_trtab1 print_trtab2 "print translation",
    print_ruletab = merge_ruletabs print_ruletab1 print_ruletab2,
    print_ast_trtab =
      merge_trtabs print_ast_trtab1 print_ast_trtab2 "print ast translation",
    prtab = merge_prtabs prtab1 prtab2};


(* type_syn *)

(*the empty syntax extended by type_ext*)
val type_syn = extend_syntax empty_syntax type_ext;



(** inspect syntax **)

(*a heading followed by the sorted, quoted strings*)
fun pretty_strs_qs name strs =
  let
    val quoted = map quote (sort_strings strs);
  in
    Pretty.strs (name :: quoted)
  end;


(* print_gram *)

(*print lexicon, roots and productions of a syntax*)
fun print_gram (Syntax {lexicon, roots, gram, ...}) =
 (Pretty.writeln (pretty_strs_qs "lexicon:" (dest_lexicon lexicon));
  Pretty.writeln (Pretty.strs ("roots:" :: roots));
  Pretty.writeln (Pretty.big_list "prods:" (pretty_gram gram)));


(* print_trans *)

(*print constants, translation function names and translation rules*)
fun print_trans
    (Syntax {consts, parse_ast_trtab, parse_ruletab, parse_trtab, print_trtab,
      print_ruletab, print_ast_trtab, ...}) =
  let
    (*only the names under which translation functions are registered*)
    fun show_trtab name tab =
      Pretty.writeln (pretty_strs_qs name (map (fn (c, _) => c) (dest_trtab tab)));

    fun show_ruletab name tab =
      Pretty.writeln (Pretty.big_list name (map pretty_rule (dest_ruletab tab)));
  in
    Pretty.writeln (pretty_strs_qs "consts:" consts);
    show_trtab "parse_ast_translation:" parse_ast_trtab;
    show_ruletab "parse_rules:" parse_ruletab;
    show_trtab "parse_translation:" parse_trtab;
    show_trtab "print_translation:" print_trtab;
    show_ruletab "print_rules:" print_ruletab;
    show_trtab "print_ast_translation:" print_ast_trtab
  end;


(* print_syntax *)

(*grammar part first, then translation part*)
fun print_syntax syn =
  let
    val _ = print_gram syn;
  in
    print_trans syn
  end;



(** read **)

(* test_read *)

(*tokenize and parse str for the given root; print the tokens, and for
  every parse tree the raw ast, then run normalize on the pre ast*)
fun test_read (Syntax {lexicon, gram, parse_ast_trtab, parse_ruletab, ...}) root str =
  let
    val tokens = tokenize lexicon false str;
    val _ = writeln ("tokens: " ^ space_implode " " (map display_token tokens));

    fun trace_tree tree =
      let
        val raw = pt_to_ast (K None) tree;
        val _ = writeln ("raw: " ^ str_of_ast raw);
        val pre = pt_to_ast (lookup_trtab parse_ast_trtab) tree;
        (*result is discarded*)
        val _ = normalize true true (lookup_ruletab parse_ruletab) pre;
      in
        ()
      end;
  in
    seq trace_tree (parse gram root tokens)
  end;


(* read_ast *)

(*parse str for the given root and convert the parse tree to an ast;
  anything other than exactly one parse tree is reported as ambiguous
  input and raises an error*)
fun read_ast (Syntax {lexicon, gram, parse_ast_trtab, ...}) xids root str =
  let
    val trees = parse gram root (tokenize lexicon xids str);

    fun show_tree tree = writeln (str_of_ast (pt_to_ast (K None) tree));

    fun ambiguous () =
     (writeln ("Ambiguous input " ^ quote str);
      writeln "produces the following parse trees:";
      seq show_tree trees;
      error "Please disambiguate the grammar or your input.");
  in
    (case trees of
      [tree] => pt_to_ast (lookup_trtab parse_ast_trtab) tree
    | _ => ambiguous ())
  end;


(* read *)

(*read a term: ast for the nonterminal of ty, normalized with the parse
  rules, then converted using the parse translations*)
fun read (syn as Syntax {parse_ruletab, parse_trtab, ...}) ty str =
  let
    val root = typ_to_nonterm ty;
    val ast = read_ast syn false root str;
  in
    ast_to_term (lookup_trtab parse_trtab)
      (normalize_ast (lookup_ruletab parse_ruletab) ast)
  end;


(* read types *)

(*read str at typeT and convert the resulting term to a typ*)
fun read_typ syn def_sort str =
  let
    val tm = read syn typeT str;
    val sorts = raw_term_sorts tm;
  in
    typ_of_term sorts def_sort tm
  end;

(*read a type with type_syn, using K [] as default sort function*)
fun simple_read_typ str = read_typ type_syn (K []) str;


(* read rules *)

(*read both patterns of an external rule, turning variables whose names
  are among the consts of syn into constants; a rule rejected by
  rule_error raises an error showing external and internal form*)
fun read_rule (syn as Syntax {consts, ...}) (xrule as ((_, lhs_src), (_, rhs_src))) =
  let
    fun constantify (ast as Constant _) = ast
      | constantify (ast as Variable x) =
          if x mem consts then Constant x else ast
      | constantify (Appl asts) = Appl (map constantify asts);

    fun read_pat (root, str) =
      constantify (read_ast syn true root str)
        handle ERROR => error ("The error above occurred in " ^ quote str);

    val rule as (lhs, rhs) = (pairself read_pat) xrule;
  in
    (case rule_error rule of
      None => rule
    | Some msg =>
        error ("Error in syntax translation rule: " ^ msg ^
          "\nexternal: " ^ quote lhs_src ^ "  ->  " ^ quote rhs_src ^
          "\ninternal: " ^ str_of_ast lhs ^ "  ->  " ^ str_of_ast rhs))
  end;


datatype xrule =
    op |-> of (string * string) * (string * string)
  | op <-| of (string * string) * (string * string)
  | op <-> of (string * string) * (string * string);

(*split external rules into a pair of rule lists: the first holds the
  |-> and <-> rules as given, the second the <-| and <-> rules with
  both sides swapped*)
fun read_xrules syn xrules =
  let
    fun right_rule (xpat1 |-> xpat2) = Some (xpat1, xpat2)
      | right_rule (_ <-| _) = None
      | right_rule (xpat1 <-> xpat2) = Some (xpat1, xpat2);

    fun left_rule (_ |-> _) = None
      | left_rule (xpat1 <-| xpat2) = Some (xpat2, xpat1)
      | left_rule (xpat1 <-> xpat2) = Some (xpat2, xpat1);

    val read_one = read_rule syn;
  in
    (map read_one (mapfilter right_rule xrules),
     map read_one (mapfilter left_rule xrules))
  end;



(** pretty terms or typs **)

(*generic printing: convert t to an ast using the print translations,
  normalize with the print rules, then hand over to pretty_ast*)
fun pretty_t t_to_ast pretty_ast
    (syn as Syntax {print_trtab, print_ruletab, print_ast_trtab, prtab, ...}) t =
  let
    val ast = t_to_ast (lookup_trtab print_trtab) t;
  in
    pretty_ast prtab (lookup_trtab print_ast_trtab)
      (normalize_ast (lookup_ruletab print_ruletab) ast)
  end;

fun pretty_term syn t = pretty_t term_to_ast pretty_term_ast syn t;
fun pretty_typ syn ty = pretty_t typ_to_ast pretty_typ_ast syn ty;

fun string_of_term syn t = Pretty.string_of (pretty_term syn t);
fun string_of_typ syn ty = Pretty.string_of (pretty_typ syn ty);

(*variants fixed to type_syn*)
fun simple_string_of_typ ty = string_of_typ type_syn ty;
fun simple_pprint_typ ty = Pretty.pprint (Pretty.quote (pretty_typ type_syn ty));



(** extend syntax (external interfaces) **)

(*build a syntax extension from the current roots and some
  declarations, then extend the syntax with it*)
fun ext_syntax mk_syn_ext (syn as Syntax {roots, ...}) decls =
  extend_syntax syn (mk_syn_ext roots decls);


(*the second argument of syn_ext_roots is all_roots without the roots
  already present in syn*)
fun extend_log_types (syn as Syntax {roots, ...}) all_roots =
  extend_syntax syn (syn_ext_roots all_roots (all_roots \\ roots));

fun extend_type_gram syn decls = ext_syntax syn_ext_types syn decls;

fun extend_const_gram syn decls = ext_syntax syn_ext_consts syn decls;

fun extend_consts syn names = ext_syntax syn_ext_const_names syn names;

fun extend_trfuns syn trfuns = ext_syntax syn_ext_trfuns syn trfuns;

(*external rules are read against syn itself before being added*)
fun extend_trrules syn xrules =
  ext_syntax syn_ext_rules syn (read_xrules syn xrules);


end;