(*  Title:      Pure/Isar/outer_syntax.ML
    ID:         $Id$
    Author:     Markus Wenzel, TU Muenchen

The global Isabelle/Isar outer syntax.
*)

(*Entry points of the read-eval-print loop; this part of the interface
  is opened at the very end of the file.*)
signature BASIC_OUTER_SYNTAX =
sig
  structure Isar:
    sig
      val main: unit -> unit
      val loop: unit -> unit
      val sync_main: unit -> unit
      val sync_loop: unit -> unit
    end;
end;

signature OUTER_SYNTAX =
sig
  include BASIC_OUTER_SYNTAX
  type token
  type parser
  (*command name comment kind parse: arguments are the command name, its
    descriptive comment, its keyword kind, and the parsing function*)
  val command: string -> string -> OuterKeyword.T ->
    (token list -> (Toplevel.transition -> Toplevel.transition) * token list) -> parser
  val markup_command: IsarOutput.markup -> string -> string -> OuterKeyword.T ->
    (token list -> (Toplevel.transition -> Toplevel.transition) * token list) -> parser
  val improper_command: string -> string -> OuterKeyword.T ->
    (token list -> (Toplevel.transition -> Toplevel.transition) * token list) -> parser
  val is_keyword: string -> bool
  val dest_keywords: unit -> string list
  (*entries are (name, comment, kind, interactive-only)*)
  val dest_parsers: unit -> (string * string * string * bool) list
  val print_outer_syntax: unit -> unit
  val print_commands: Toplevel.transition -> Toplevel.transition
  val add_keywords: string list -> unit
  val add_parsers: parser list -> unit
  val check_text: string * Position.T -> Toplevel.state -> unit
  val deps_thy: string -> bool -> Path.T -> string list * Path.T list
  val load_thy: string -> bool -> bool -> Path.T -> unit
  val isar: bool -> bool -> unit Toplevel.isar
  val scan: string -> OuterLex.token list
  val read: OuterLex.token list -> (string * OuterLex.token list * Toplevel.transition) list
end;

structure OuterSyntax : OUTER_SYNTAX =
struct

structure T = OuterLex;
structure P = OuterParse;


(** outer syntax **)

(* parsers *)

type token = T.token;
type parser_fn = token list -> (Toplevel.transition -> Toplevel.transition) * token list;

(*Parser (name, (comment, kind, markup), int_only, parse)*)
datatype parser =
  Parser of string * (string * OuterKeyword.T * IsarOutput.markup option) * bool * parser_fn;

(*Generic constructor; the argument order is chosen so that the public
  variants at the end of this structure arise by partial application of
  int_only and markup.*)
fun parser int_only markup name comment kind parse =
  Parser (name, (comment, kind, markup), int_only, parse);


(* parse command *)

local

(*Terminator after a command: with false nothing is parsed
  (Scan.succeed ()); with true an optional sync token followed by a
  semicolon is parsed.  The result is unit in both cases.*)
fun terminate false = Scan.succeed ()
  | terminate true = P.group "end of input" (Scan.option P.sync -- P.semicolon >> K ());

(*With tracing enabled the parser is wrapped in Scan.trace and the
  resulting transition is composed with Toplevel.source applied to the
  token list delivered by Scan.trace.*)
fun trace false parse = parse
  | trace true parse = Scan.trace parse >> (fn (f, toks) => f o Toplevel.source toks);

(*Parse the remainder of command name (after P.tags) using the parser
  obtained from the lookup function cmd; the prompt is the command name
  followed by "# ".  Yields (int_only, transition transformer).  A name
  without a registered parser is reported via sys_error.*)
fun body cmd do_trace (name, _) =
  (case cmd name of
    SOME (int_only, parse) =>
      P.!!! (Scan.prompt (name ^ "# ") (trace do_trace (P.tags |-- parse) >> pair int_only))
  | NONE => sys_error ("no parser for outer syntax command " ^ quote name));

in

(*Parse one toplevel item.  A lone semicolon or sync token yields NONE;
  a command yields SOME transition, built from Toplevel.empty by setting
  name, position and the interactive-only flag, then applying the
  transformer f produced by the command's own parser.
  Note: this parser-level command is shadowed by the public constructor
  of the same name declared at the very end of the structure.*)
fun command do_terminate do_trace cmd =
  P.semicolon >> K NONE ||
  P.sync >> K NONE ||
  (P.position P.command :-- body cmd do_trace) --| terminate do_terminate
    >> (fn ((name, pos), (int_only, f)) =>
      SOME (Toplevel.empty |> Toplevel.name name |> Toplevel.position pos |>
        Toplevel.interactive int_only |> f));

end;



(** global outer syntax **)

local

(*Pair of lexicons: add_keywords below extends the first component,
  add_parsers (command names) the second.*)
val global_lexicons = ref (Scan.empty_lexicon, Scan.empty_lexicon);
(*Table: name -> (((comment, kind), (int_only, parse)), markup option)*)
val global_parsers =
  ref (Symtab.empty: (((string * OuterKeyword.T) * (bool * parser_fn)) * IsarOutput.markup option)
    Symtab.table);
(*Association list derived from global_parsers, see make_markups*)
val global_markups = ref ([]: (string * IsarOutput.markup) list);

(*Apply f to the lexicon pair; the result is stored only if the contents
  of the two lexicons are disjoint, otherwise an error listing the
  clashing entries is raised and the reference is left unchanged.*)
fun change_lexicons f =
  let val lexs = f (! global_lexicons) in
    (case (op inter_string) (pairself Scan.dest_lexicon lexs) of
      [] => global_lexicons := lexs
    | bads => error ("Clash of outer syntax commands and keywords: " ^ commas_quote bads))
  end;

(*Recompute global_markups from scratch: one (name, markup) entry for
  each parser table entry whose markup component is SOME.*)
fun make_markups () = global_markups :=
  Symtab.fold (fn (name, (_, SOME m)) => cons (name, m) | _ => I) (! global_parsers) [];

(*Update the parser table and refresh the derived markup list*)
fun change_parsers f = (Library.change global_parsers f; make_markups ());

in


(* access current syntax *)

(*Note: the syntax for files is statically determined at the very
  beginning; for interactive processing it may change dynamically.*)

fun get_lexicons () = ! global_lexicons;
fun get_parsers () = ! global_parsers;
(*Snapshot of the parser table as a lookup function:
  name -> (int_only, parse) option*)
fun get_parser () = Option.map (#2 o #1) o Symtab.curried_lookup (get_parsers ());

(*Tags of the keyword kind of command name; [] for an unknown command*)
fun command_tags name =
  (case Symtab.curried_lookup (get_parsers ()) name of
    SOME (((_, k), _), _) => OuterKeyword.tags_of k
  | NONE => []);

(*True iff name is recorded in global_markups with exactly this kind*)
fun is_markup kind name = (AList.lookup (op =) (! global_markups) name = SOME kind);


(* augment syntax *)

fun add_keywords keywords = change_lexicons (apfst (fn lex =>
  (Scan.extend_lexicon lex (map Symbol.explode keywords))));

(*Enter a single parser into table tab; an already defined name only
  triggers a warning, the table is updated in any case.*)
fun add_parser (Parser (name, (comment, kind, markup), int_only, parse)) tab =
 (if not (Symtab.defined tab name) then ()
  else warning ("Redefined outer syntax command " ^ quote name);
  Symtab.curried_update (name, (((comment, kind), (int_only, parse)), markup)) tab);

(*Register parsers: first the parser table (and markups), then the
  command lexicon.
  NOTE(review): the table is changed before change_lexicons performs its
  clash check, so a clash error leaves the new parsers registered while
  the lexicon is unchanged -- confirm whether this is intended.*)
fun add_parsers parsers =
  (change_parsers (fold add_parser parsers);
    change_lexicons (apsnd (fn lex => Scan.extend_lexicon lex
      (map (fn Parser (name, _, _, _) => Symbol.explode name) parsers))));

end;


(* print syntax *)

(*Both functions consult the first (keyword) lexicon only*)
fun is_keyword s = Scan.is_literal (#1 (get_lexicons ())) (Symbol.explode s);
fun dest_keywords () = Scan.dest_lexicon (#1 (get_lexicons ()));

(*All registered commands as (name, comment, kind, int_only), passed
  through sort_wrt on the name component.*)
fun dest_parsers () =
  get_parsers () |> Symtab.dest |> sort_wrt #1
  |> map (fn (name, (((cmt, kind), (int_only, _)), _)) =>
    (name, cmt, OuterKeyword.kind_of kind, int_only));

(*Print keywords and commands; commands are split on their int_only
  flag into improper (interactive-only) and proper ones.*)
fun print_outer_syntax () =
  let
    fun pretty_cmd (name, comment, _, _) =
      Pretty.block [Pretty.str (name ^ ":"), Pretty.brk 2, Pretty.str comment];
    val (int_cmds, cmds) = List.partition #4 (dest_parsers ());
  in
    [Pretty.strs ("syntax keywords:" :: map quote (dest_keywords ())),
      Pretty.big_list "proper commands:" (map pretty_cmd cmds),
      Pretty.big_list "improper commands (interactive-only):" (map pretty_cmd int_cmds)]
    |> Pretty.chunks |> Pretty.writeln
  end;

val print_commands = Toplevel.imperative print_outer_syntax;



(** toplevel parsing **)

(* basic sources *)

(*Turn a token source into a source of toplevel transitions.
    term        passed to command as do_terminate
    do_trace    passed to command as do_trace
    do_recover  install the recover function on both stages
    cmd         thunk yielding the command lookup function; it is called
                anew for each command parse (cmd ())
  Stage 1 maps "--" followed by text to NONE and every other token to
  SOME; stage 2 parses commands.  Source.mapfilter I drops the NONE
  results of each stage.*)
fun toplevel_source term do_trace do_recover cmd src =
  let
    (*any token that is neither semicolon, sync nor eof*)
    val no_terminator =
      Scan.unless P.semicolon (Scan.one (T.not_sync andf T.not_eof));
    (*recovery: consume tokens matching no_terminator, produce no result*)
    fun recover x = (Scan.prompt "recover# " (Scan.repeat no_terminator) >> K [NONE]) x;
  in
    src
    |> T.source_proper
    |> Source.source T.stopper
      (Scan.bulk (P.$$$ "--" -- P.!!! P.text >> K NONE || P.not_eof >> SOME))
      (if do_recover then SOME recover else NONE)
    |> Source.mapfilter I
    |> Source.source T.stopper (Scan.bulk (fn xs => P.!!! (command term do_trace (cmd ())) xs))
      (if do_recover then SOME recover else NONE)
    |> Source.mapfilter I
  end;


(* interactive source of toplevel transformers *)

(*Transitions read from Source.tty.  The functions get_lexicons and
  get_parser are passed unevaluated, so the syntax current at parse time
  is used; recovery is enabled, tracing is off.  With no_pos, tokens
  carry Position.none instead of line positions named "stdin".*)
fun isar term no_pos =
  Source.tty
  |> Symbol.source true
  |> T.source true get_lexicons
    (if no_pos then Position.none else Position.line_name 1 "stdin")
  |> toplevel_source term false true get_parser;


(* scan text *)

(*Tokenize a string with the current lexicons, without positions*)
fun scan str =
  Source.of_string str
  |> Symbol.source false
  |> T.source true get_lexicons Position.none
  |> Source.exhaust;


(* read tokens with trace *)

(*Parse a token list into (command name, source tokens, transition)
  triples; tracing is switched on here.
  NOTE(review): the (Toplevel.source_of tr) presumably relies on the
  source being attached by tracing -- confirm against Toplevel.*)
fun read toks =
  Source.of_list toks
  |> toplevel_source false true true get_parser
  |> Source.exhaust
  |> map (fn tr => (Toplevel.name_of tr, the (Toplevel.source_of tr), tr));



(** read theory **)

(* check_text *)

(*Run IsarOutput.eval_antiquote on s with the keyword lexicon and
  discard its result.*)
fun check_text s state = (IsarOutput.eval_antiquote (#1 (get_lexicons ())) state s; ());


(* deps_thy *)

(*Scan the theory header of the file at path.  Returns the parents and
  the files of the header, followed by the ML file of the theory if ml
  is set and ThyLoad.check_file finds it.  Raises an error if the name
  in the header differs from name.*)
fun deps_thy name ml path =
  let
    val src = Source.of_string (File.read path);
    val pos = Path.position path;
    val (name', parents, files) = ThyHeader.scan (src, pos);
    val ml_path = ThyLoad.ml_path name;
    val ml_file = if ml andalso is_some (ThyLoad.check_file NONE ml_path) then [ml_path] else [];
  in
    if name <> name' then
      error ("Filename " ^ quote (Path.pack path) ^
        " does not agree with theory name " ^ quote name')
    else (parents, map (Path.unpack o #1) files @ ml_file)
  end;


(* load_thy *)

local

(*Load the ML file of theory name, if ThyLoad.check_file finds it, as a
  toplevel excursion consisting of a single transition named "use" or
  "time_use".*)
fun try_ml_file name time =
  let
    val path = ThyLoad.ml_path name;
    val tr = Toplevel.imperative (fn () => ThyInfo.load_file time path);
    val tr_name = if time then "time_use" else "use";
  in
    if is_none (ThyLoad.check_file NONE path) then ()
    else Toplevel.excursion [Toplevel.empty |> Toplevel.name tr_name |> tr]
  end;

(*Process the theory file at path: files recognized by ThyHeader.is_old
  are handed to ThySyn.load_thy with a deprecation warning; otherwise
  the text is tokenized and parsed into transitions, which are passed
  to IsarOutput.present_thy.  Lexicons and parsers are fetched once
  (K (get_lexicons ()), K (get_parser ())), i.e. the syntax is fixed
  before parsing starts; tracing and recovery are off.*)
fun run_thy name path =
  let
    val pos = Path.position path;
    val text = Library.untabify (explode (File.read path));
    val text_src = Source.of_list text;
    fun present_text () = Source.exhaust (Symbol.source false text_src);
  in
    Present.init_theory name;
    Present.verbatim_source name present_text;
    if ThyHeader.is_old (text_src, pos) then
     (warning ("Non-Isar file format for theory " ^ quote name ^ " -- deprecated");
      ThySyn.load_thy name text;
      Present.old_symbol_source name present_text)   (*note: text presented twice*)
    else
      let
        val tok_src = text_src
          |> Symbol.source false
          |> T.source false (K (get_lexicons ())) pos
          |> Source.exhausted;
        val trs =
          tok_src
          |> toplevel_source false false false (K (get_parser ()))
          |> Source.exhaust;
      in
        IsarOutput.present_thy (#1 (get_lexicons ())) command_tags is_markup trs tok_src
        |> Buffer.content
        |> Present.theory_output name
      end
  end;

in

(*Load theory name from path, optionally timed and framed by
  start/finish messages; then set the context to the loaded theory and,
  if ml is set, try to load its ML file.*)
fun load_thy name ml time path =
 (if time then
    timeit (fn () =>
     (writeln ("\n**** Starting theory " ^ quote name ^ " ****");
      run_thy name path;
      writeln ("**** Finished theory " ^ quote name ^ " ****\n")))
  else run_thy name path;
  Context.context (ThyInfo.get_theory name);
  if ml then try_ml_file name time else ());

end;



(** the read-eval-print loop **)

(* main loop *)

(*Reset the context, run the Isar toplevel loop, and set the ML prompts
  once the loop returns.*)
fun gen_loop term no_pos =
 (Context.reset_context ();
  Toplevel.loop (isar term no_pos);
  ml_prompts "ML> " "ML# ");

(*Like gen_loop, but first resets the toplevel state and prints the
  session welcome message.*)
fun gen_main term no_pos =
 (Toplevel.set_state Toplevel.toplevel;
  writeln (Session.welcome ());
  gen_loop term no_pos);

(*The sync variants set both term and no_pos*)
structure Isar =
struct
  fun main () = gen_main false false;
  fun loop () = gen_loop false false;
  fun sync_main () = gen_main true true;
  fun sync_loop () = gen_loop true true;
end;


(*final declarations of this structure!*)
(*These must stay last: command shadows the parser-level command above,
  which toplevel_source refers to.*)
val command = parser false NONE;
val markup_command = parser false o SOME;
val improper_command = parser true NONE;

end;

(*setup theory syntax dependent operations*)
ThyLoad.deps_thy_fn := OuterSyntax.deps_thy;
ThyLoad.load_thy_fn := OuterSyntax.load_thy;
structure ThyLoad: THY_LOAD = ThyLoad;

structure BasicOuterSyntax: BASIC_OUTER_SYNTAX = OuterSyntax;
open BasicOuterSyntax;
open Isar;