src/Pure/Isar/outer_syntax.ML
author wenzelm
Thu Apr 29 06:04:01 2004 +0200 (2004-04-29)
changeset 14687 e089757b952a
parent 14091 ad6ba9c55190
child 14925 0f86a8a694f8
permissions -rw-r--r--
added is_keyword;
wenzelm@5829
     1
(*  Title:      Pure/Isar/outer_syntax.ML
wenzelm@5829
     2
    ID:         $Id$
wenzelm@5829
     3
    Author:     Markus Wenzel, TU Muenchen
wenzelm@8807
     4
    License:    GPL (GNU GENERAL PUBLIC LICENSE)
wenzelm@5829
     5
wenzelm@5829
     6
The global Isabelle/Isar outer syntax.
wenzelm@5829
     7
*)
wenzelm@5829
     8
wenzelm@5829
     9
(*Entry points of the Isar read-eval-print loop; this part of the interface
  is opened at the ML top level at the end of the file.*)
signature BASIC_OUTER_SYNTAX =
sig
  (*initialize the toplevel state, print the welcome message, enter the loop*)
  val main: unit -> unit
  val sync_main: unit -> unit
  (*reset the context and (re-)enter the loop*)
  val loop: unit -> unit
  val sync_loop: unit -> unit
  (*the sync_ variants run with explicit command terminators and without
    input positions (both flags set)*)
end;
wenzelm@5829
    16
wenzelm@5829
    17
(*Full interface of the global Isabelle/Isar outer syntax.*)
signature OUTER_SYNTAX =
sig
  include BASIC_OUTER_SYNTAX

  (*command keyword classification: names of the available command kinds*)
  structure Keyword:
    sig
      val control: string
      val diag: string
      val thy_begin: string
      val thy_switch: string
      val thy_end: string
      val thy_heading: string
      val thy_decl: string
      val thy_script: string
      val thy_goal: string
      val qed: string
      val qed_block: string
      val qed_global: string
      val prf_heading: string
      val prf_goal: string
      val prf_block: string
      val prf_open: string
      val prf_close: string
      val prf_chain: string
      val prf_decl: string
      val prf_asm: string
      val prf_asm_goal: string
      val prf_script: string
      val kinds: string list
    end

  (*command parsers; arguments are: name, comment, kind, parse function*)
  type token
  type parser
  val command: string -> string -> string ->
    (token list -> (Toplevel.transition -> Toplevel.transition) * token list) -> parser
  val markup_command: IsarOutput.markup -> string -> string -> string ->
    (token list -> (Toplevel.transition -> Toplevel.transition) * token list) -> parser
  val improper_command: string -> string -> string ->
    (token list -> (Toplevel.transition -> Toplevel.transition) * token list) -> parser

  (*inspect the current global syntax; dest_parsers yields
    (name, comment, kind, interactive-only) per command*)
  val is_keyword: string -> bool
  val dest_keywords: unit -> string list
  val dest_parsers: unit -> (string * string * string * bool) list
  val print_outer_syntax: unit -> unit
  val print_commands: Toplevel.transition -> Toplevel.transition

  (*augment the global syntax*)
  val add_keywords: string list -> unit
  val add_parsers: parser list -> unit

  (*theory text and files*)
  val check_text: string * Position.T -> bool -> Toplevel.state -> unit
  val deps_thy: string -> bool -> Path.T -> string list * Path.T list
  val load_thy: string -> bool -> bool -> Path.T -> unit

  (*sources of toplevel transitions: terminal input and string input*)
  val isar: bool -> bool -> unit Toplevel.isar
  val isar_readstring: Position.T -> string -> (string list) Toplevel.isar
end;
wenzelm@5829
    67
wenzelm@5829
    68
structure OuterSyntax: OUTER_SYNTAX =
wenzelm@5829
    69
struct
wenzelm@5829
    70
wenzelm@7750
    71
structure T = OuterLex;
wenzelm@6860
    72
structure P = OuterParse;
wenzelm@6860
    73
wenzelm@5829
    74
wenzelm@5829
    75
(** outer syntax **)
wenzelm@5829
    76
wenzelm@6722
    77
(* command keyword classification *)
wenzelm@6722
    78
wenzelm@6722
    79
(*Names of command kinds, as used for the kind argument of command parsers.*)
structure Keyword =
struct
  (*toplevel control and diagnostics*)
  val control = "control";
  val diag = "diag";

  (*theory level*)
  val thy_begin = "theory-begin";
  val thy_switch = "theory-switch";
  val thy_end = "theory-end";
  val thy_heading = "theory-heading";
  val thy_decl = "theory-decl";
  val thy_script = "theory-script";
  val thy_goal = "theory-goal";

  (*proof conclusions*)
  val qed = "qed";
  val qed_block = "qed-block";
  val qed_global = "qed-global";

  (*proof level*)
  val prf_heading = "proof-heading";
  val prf_goal = "proof-goal";
  val prf_block = "proof-block";
  val prf_open = "proof-open";
  val prf_close = "proof-close";
  val prf_chain = "proof-chain";
  val prf_decl = "proof-decl";
  val prf_asm = "proof-asm";
  val prf_asm_goal = "proof-asm-goal";
  val prf_script = "proof-script";

  (*all kinds, in declaration order*)
  val kinds =
    [control, diag] @
    [thy_begin, thy_switch, thy_end, thy_heading, thy_decl, thy_script, thy_goal] @
    [qed, qed_block, qed_global] @
    [prf_heading, prf_goal, prf_block, prf_open, prf_close, prf_chain, prf_decl, prf_asm,
      prf_asm_goal, prf_script];
end;
wenzelm@6722
   108
wenzelm@6722
   109
wenzelm@5829
   110
(* parsers *)
wenzelm@5829
   111
wenzelm@7750
   112
(*tokens are those of the outer lexer*)
type token = T.token;

(*a parse function consumes tokens and yields a transformer of toplevel transitions*)
type parser_fn =
  token list -> (Toplevel.transition -> Toplevel.transition) * token list;

(*command parser: name, (comment, kind, optional markup), interactive-only flag, parse function*)
datatype parser =
  Parser of string * (string * string * IsarOutput.markup option) * bool * parser_fn;

(*generic constructor, with the two classification arguments given first*)
fun parser interactive_only mark cmd_name cmd_comment cmd_kind parse_fn =
  Parser (cmd_name, (cmd_comment, cmd_kind, mark), interactive_only, parse_fn);
wenzelm@5829
   120
wenzelm@5829
   121
wenzelm@5829
   122
(* parse command *)
wenzelm@5829
   123
wenzelm@6860
   124
local

(*Scanner for the body of command cmd_name, as determined by the given lookup
  function; the result is paired with the interactive-only flag.  A command
  without a parser is a system error.*)
fun command_body lookup (cmd_name, _) =
  let
    fun missing () = sys_error ("no parser for outer syntax command " ^ quote cmd_name);
    fun body (int_only, parse) =
      P.!!! (Scan.prompt (cmd_name ^ "# ") (parse >> pair int_only));
  in
    (case lookup cmd_name of
      None => missing ()
    | Some entry => body entry)
  end;

(*explicit terminator: optional sync token followed by semicolon; nothing if not required*)
fun terminator required =
  if required then
    P.group "end of input" ((Scan.option P.sync -- P.semicolon) >> K ())
  else Scan.succeed ();

in

(*Scan a single command: lone semicolons and sync tokens yield None, a proper
  command yields a named, positioned toplevel transition.*)
fun command term cmd =
  let
    fun transition ((name, pos), (int_only, f)) =
      Some (f (Toplevel.interactive int_only
        (Toplevel.position pos (Toplevel.name name Toplevel.empty))));
    val proper = (P.position P.command :-- command_body cmd) --| terminator term;
  in
    P.semicolon >> K None ||
    P.sync >> K None ||
    proper >> transition
  end;

end;
wenzelm@6199
   145
wenzelm@5829
   146
wenzelm@5829
   147
wenzelm@9132
   148
(** global outer syntax **)
wenzelm@5829
   149
wenzelm@7026
   150
local
wenzelm@7026
   151
wenzelm@7026
   152
(*pair of lexicons: keywords (first) and command names (second)*)
val global_lexicons = ref (Scan.empty_lexicon, Scan.empty_lexicon);

(*command table: name -> (((comment, kind), (interactive-only, parse function)), markup)*)
val global_parsers:
    (((string * string) * (bool * parser_fn)) * IsarOutput.markup option) Symtab.table ref =
  ref Symtab.empty;

(*association list of command names with markup, derived from global_parsers*)
val global_markups: (string * IsarOutput.markup) list ref = ref [];
wenzelm@5952
   157
wenzelm@7026
   158
(*Apply f to the pair of global lexicons; the result is only stored if the two
  lexicons have no entry in common, otherwise an error is raised.*)
fun change_lexicons f =
  let
    val updated = f (! global_lexicons);
    val (keywords, commands) = pairself Scan.dest_lexicon updated;
    val clashes = keywords inter_string commands;
  in
    if null clashes then global_lexicons := updated
    else error ("Clash of outer syntax commands and keywords: " ^ commas_quote clashes)
  end;
wenzelm@5829
   164
wenzelm@7789
   165
(*collect (name, markup) for table entries that carry markup*)
fun get_markup (acc, (name, (_, markup))) =
  (case markup of
    Some m => (name, m) :: acc
  | None => acc);

(*recompute global_markups from the current parser table*)
fun make_markups () =
  let val tab = ! global_parsers
  in global_markups := Symtab.foldl get_markup ([], tab) end;

(*update the parser table and keep global_markups in step with it*)
fun change_parsers f =
  let val _ = Library.change global_parsers f
  in make_markups () end;
wenzelm@6722
   170
wenzelm@7026
   171
in
wenzelm@7026
   172
wenzelm@7750
   173
wenzelm@9132
   174
(* access current syntax *)
wenzelm@7026
   175
wenzelm@7026
   176
(*Note: the syntax for files is statically determined at the very
wenzelm@7026
   177
  beginning; for interactive processing it may change dynamically.*)
wenzelm@7026
   178
wenzelm@7026
   179
(*current pair of lexicons (keywords, commands)*)
fun get_lexicons () = ! global_lexicons;

(*current parser table*)
fun get_parsers () = ! global_parsers;

(*lookup function wrt. the parser table as it is at the time of the call;
  yields the (interactive-only, parse function) part of an entry*)
fun get_parser () =
  let val tab = ! global_parsers
  in fn name => apsome (fn ((_, p), _) => p) (Symtab.lookup (tab, name)) end;
wenzelm@7789
   182
wenzelm@9132
   183
(*does command name currently carry exactly the given kind of markup?*)
fun is_markup kind name =
  let val registered = assoc (! global_markups, name)
  in (case registered of None => false | Some k => k = kind) end;

(*scan one command token whose name carries the given kind of markup*)
fun markup kind =
  let fun relevant tok = T.is_kind T.Command tok andalso is_markup kind (T.val_of tok)
  in Scan.one relevant end;
wenzelm@5829
   186
wenzelm@5829
   187
wenzelm@5829
   188
(* augment syntax *)
wenzelm@5829
   189
wenzelm@7026
   190
(*Extend the keyword lexicon (first component of the global lexicons); the
  clash check against command names is done by change_lexicons.*)
fun add_keywords keywords =
  let
    fun extend (keyword_lex, command_lex) =
      (Scan.extend_lexicon keyword_lex (map Symbol.explode keywords), command_lex);
  in change_lexicons extend end;
wenzelm@5829
   192
wenzelm@7750
   193
(*Enter a single parser into the table, with a warning if a command of the
  same name is already present (the old entry is replaced).*)
fun add_parser (tab, Parser (name, (comment, kind, markup), int_only, parse)) =
  let
    val entry = (((comment, kind), (int_only, parse)), markup);
    val _ =
      (case Symtab.lookup (tab, name) of
        None => ()
      | Some _ => warning ("Redefined outer syntax command " ^ quote name));
  in Symtab.update ((name, entry), tab) end;
wenzelm@5829
   197
wenzelm@5829
   198
(*Register command parsers: their names are added to the command lexicon
  (second component of the global lexicons) and the parsers are entered into
  the global table.

  The lexicon is extended FIRST, because change_lexicons raises an error if a
  command name clashes with a keyword.  Doing the table update afterwards
  means a failing call leaves the parser table and the derived markup list
  untouched, instead of keeping commands that never made it into the lexicon.*)
fun add_parsers parsers =
  let
    val names = map (fn Parser (name, _, _, _) => Symbol.explode name) parsers;
  in
    change_lexicons (apsnd (fn lex => Scan.extend_lexicon lex names));
    change_parsers (fn tab => foldl add_parser (tab, parsers))
  end;
wenzelm@7026
   202
wenzelm@7026
   203
end;
wenzelm@5829
   204
wenzelm@5829
   205
wenzelm@7026
   206
(* print syntax *)
wenzelm@7026
   207
wenzelm@14687
   208
(*is s a literal of the current keyword lexicon?*)
fun is_keyword s =
  let val (keywords, _) = get_lexicons ()
  in Scan.is_literal keywords (Symbol.explode s) end;

(*all entries of the current keyword lexicon*)
fun dest_keywords () =
  let val (keywords, _) = get_lexicons ()
  in Scan.dest_lexicon keywords end;
wenzelm@7026
   210
wenzelm@7026
   211
(*current commands as (name, comment, kind, interactive-only) tuples*)
fun dest_parsers () =
  let
    fun info (name, (((cmt, kind), (int_only, _)), _)) = (name, cmt, kind, int_only);
  in map info (Symtab.dest (get_parsers ())) end;
wenzelm@5829
   214
wenzelm@9223
   215
(*Print the syntax keywords, followed by the proper commands and the
  interactive-only commands, each with its comment.*)
fun print_outer_syntax () =
  let
    fun pretty_cmd (name, comment, _, _) =
      Pretty.block [Pretty.str (name ^ ":"), Pretty.brk 2, Pretty.str comment];
    val (int_cmds, cmds) =
      partition (fn (_, _, _, int_only) => int_only) (dest_parsers ());

    val keywords_part = Pretty.strs ("syntax keywords:" :: map quote (dest_keywords ()));
    val proper_part = Pretty.big_list "proper commands:" (map pretty_cmd cmds);
    val improper_part =
      Pretty.big_list "improper commands (interactive-only):" (map pretty_cmd int_cmds);
  in
    Pretty.writeln (Pretty.chunks [keywords_part, proper_part, improper_part])
  end;

(*the same as a toplevel transition*)
val print_commands = Toplevel.imperative print_outer_syntax;
wenzelm@7367
   228
wenzelm@5829
   229
wenzelm@5829
   230
wenzelm@9132
   231
(** toplevel parsing **)
wenzelm@5829
   232
wenzelm@9132
   233
(* basic sources *)
wenzelm@6860
   234
wenzelm@9132
   235
(*Turn a token source into a source of toplevel transitions, in two stages:
  first a "--" token followed by text is dropped from the proper tokens, then
  commands are parsed, with the parser lookup cmd () obtained afresh for each
  command.  If do_recover is set, both stages skip input up to the next
  semicolon / sync / eof token after a failure.*)
fun toplevel_source term do_recover cmd src =
  let
    val ordinary_token = Scan.one (fn tok => T.not_sync tok andalso T.not_eof tok);
    val no_terminator = Scan.unless P.semicolon ordinary_token;

    (*note: kept as functions, since recovery is used at two different result types*)
    fun recover toks =
      (Scan.prompt "recover# " (Scan.repeat no_terminator) >> K [None]) toks;
    fun recovery () = if do_recover then Some recover else None;

    val strip_comment = P.$$$ "--" -- P.!!! P.text >> K None || P.not_eof >> Some;
    fun parse_command toks = P.!!! (command term (cmd ())) toks;

    val proper_tokens =
      Source.mapfilter I
        (Source.source T.stopper (Scan.bulk strip_comment) (recovery ())
          (T.source_proper src));
  in
    Source.mapfilter I
      (Source.source T.stopper (Scan.bulk parse_command) (recovery ()) proper_tokens)
  end;
wenzelm@5829
   251
wenzelm@7746
   252
wenzelm@9132
   253
(* interactive source of toplevel transformers *)
wenzelm@5829
   254
wenzelm@9132
   255
(*Transitions read from the terminal, using the current (dynamically changing)
  lexicons and parsers, with error recovery.  Positions start at line 1 of
  "stdin", unless no_pos is set.*)
fun isar term no_pos =
  let
    val symbols = Symbol.source true Source.tty;
    val pos = if no_pos then Position.none else Position.line_name 1 "stdin";
    val tokens = T.source true get_lexicons pos symbols;
  in toplevel_source term true get_parser tokens end;
wenzelm@6199
   261
wenzelm@6199
   262
nipkow@14091
   263
(* string source of transformers (for Proof General) *)
nipkow@14091
   264
nipkow@14091
   265
(*Transitions read from the string str, with tokens positioned relative to
  pos; commands need no explicit terminator, error recovery is enabled.*)
fun isar_readstring pos str =
  let
    val symbols = Symbol.source false (Source.of_string str);
    val tokens = T.source false get_lexicons pos symbols;
  in toplevel_source false true get_parser tokens end;
nipkow@14091
   270
nipkow@14091
   271
wenzelm@7746
   272
wenzelm@9132
   273
(** read theory **)
wenzelm@6247
   274
wenzelm@12943
   275
(* check_text *)
wenzelm@12943
   276
wenzelm@12943
   277
(*If the flag is set, evaluate the antiquotations of text s in the given state
  (wrt. the current keyword lexicon) and discard the result; otherwise do nothing.*)
fun check_text s enabled state =
  if enabled then
    let val (keywords, _) = get_lexicons ()
    in IsarOutput.eval_antiquote keywords state s; () end
  else ();
wenzelm@12943
   279
wenzelm@12943
   280
wenzelm@9132
   281
(* deps_thy *)
wenzelm@6199
   282
wenzelm@7940
   283
(*Scan the header of the theory file at path and return its parents together
  with the files it depends on; the ML file of the theory is included if ml is
  set and the file exists.  The theory name given in the header has to agree
  with name.*)
fun deps_thy name ml path =
  let
    val header_src = Source.of_string (File.read path);
    val (name', parents, files) = ThyHeader.scan (header_src, Path.position path);

    val ml_path = ThyLoad.ml_path name;
    val ml_present = ml andalso is_some (ThyLoad.check_file ml_path);
    val ml_file = if ml_present then [ml_path] else [];
  in
    if name = name' then (parents, map (Path.unpack o #1) files @ ml_file)
    else
      error ("Filename " ^ quote (Path.pack path) ^
        " does not agree with theory name " ^ quote name')
  end;
wenzelm@6199
   296
wenzelm@7746
   297
wenzelm@9132
   298
(* load_thy *)
wenzelm@6199
   299
wenzelm@7746
   300
local
wenzelm@7746
   301
wenzelm@7940
   302
(*Load the ML file of theory name, provided it exists; this is done within a
  toplevel excursion of a single transition named "use" or "time_use".*)
fun try_ml_file name time =
  let
    val path = ThyLoad.ml_path name;
    fun load () = ThyInfo.load_file time path;
    val tr_name = if time then "time_use" else "use";
  in
    (case ThyLoad.check_file path of
      None => ()
    | Some _ =>
        Toplevel.excursion [Toplevel.imperative load (Toplevel.name tr_name Toplevel.empty)])
  end;
wenzelm@6199
   311
wenzelm@9132
   312
(*Parse all commands of a token source, without terminators or recovery; the
  parser table is fixed once at the beginning.*)
fun parse_thy src =
  let val lookup = get_parser ()
  in Source.exhaust (toplevel_source false false (fn () => lookup) src) end;
wenzelm@5829
   316
wenzelm@6247
   317
(*Process the theory file at path under the given theory name.  The text is
  registered for presentation; if ThyHeader.is_old holds for it, loading is
  delegated to ThySyn.load_thy, otherwise the text is tokenized, parsed and run
  as a toplevel excursion whose output is handed to Present.theory_output.*)
fun run_thy name path =
  let
    val pos = Path.position path;
    val text = Library.untabify (explode (File.read path));
    val text_src = Source.of_list text;
    fun present_text () = Source.exhaust (Symbol.source false text_src);

    (*note: text presented twice*)
    fun run_old () =
     (ThySyn.load_thy name text;
      Present.old_symbol_source name present_text);

    fun run_isar () =
      let
        val tok_src =
          Source.exhausted
            (T.source false (K (get_lexicons ())) pos (Symbol.source false text_src));
        val keywords = #1 (get_lexicons ());
        val out =
          Toplevel.excursion_result
            (IsarOutput.parse_thy markup keywords (parse_thy tok_src) tok_src);
      in Present.theory_output name (Buffer.content out) end;
  in
    Present.init_theory name;
    Present.verbatim_source name present_text;
    if ThyHeader.is_old (text_src, pos) then run_old () else run_isar ()
  end;
wenzelm@6199
   339
wenzelm@7746
   340
in
wenzelm@7746
   341
wenzelm@6199
   342
(*Load theory name from the file at path (with start / finish messages and
  timing if time is set), make it the current context, and finally try to
  load its ML file if ml is set.*)
fun load_thy name ml time path =
  let
    fun timed_run () =
     (writeln ("\n**** Starting theory " ^ quote name ^ " ****");
      run_thy name path;
      writeln ("**** Finished theory " ^ quote name ^ " ****\n"));

    val _ = if time then timeit timed_run else run_thy name path;
    val _ = Context.context (ThyInfo.get_theory name);
  in
    if ml then try_ml_file name time else ()
  end;
wenzelm@5829
   351
wenzelm@7746
   352
end;
wenzelm@7746
   353
wenzelm@5829
   354
wenzelm@5829
   355
wenzelm@5829
   356
(** the read-eval-print loop **)
wenzelm@5829
   357
wenzelm@5923
   358
(* main loop *)
wenzelm@5923
   359
wenzelm@7333
   360
(*reset the context, then run the toplevel loop on terminal input*)
fun gen_loop term no_pos =
  let val _ = Context.reset_context ()
  in Toplevel.loop (isar term no_pos) end;

(*initialize the toplevel state and print the welcome message, then enter the loop*)
fun gen_main term no_pos =
  let
    val _ = Toplevel.set_state Toplevel.toplevel;
    val _ = writeln (Session.welcome ());
  in gen_loop term no_pos end;
wenzelm@6860
   368
wenzelm@7333
   369
(*Public entry points: the plain versions run without explicit terminators and
  with input positions, the sync versions set both flags.*)
local
  fun start entry sync () = entry sync sync;
in
  val main = start gen_main false;
  val loop = start gen_loop false;
  val sync_main = start gen_main true;
  val sync_loop = start gen_loop true;
end;
wenzelm@5829
   373
wenzelm@5829
   374
wenzelm@5829
   375
(* help *)
wenzelm@5829
   376
wenzelm@5829
   377
(*tell the user how to get from the ML toplevel back into the Isar loop*)
fun help () =
  let
    val system_line = "This is Isabelle's underlying ML system (" ^ ml_system ^ ");\n";
    val loop_line = "invoke 'Isar.loop();' to get back to the Isar read-eval-print loop.";
  in writeln (system_line ^ loop_line) end;
wenzelm@5829
   380
wenzelm@5829
   381
wenzelm@6373
   382
(*final declarations of this structure!*)
wenzelm@7789
   383
(*proper command without markup; note that this rebinds the name of the
  command scanner defined earlier in this structure*)
fun command name comment kind parse = parser false None name comment kind parse;

(*proper command with the given markup*)
fun markup_command mark = parser false (Some mark);

(*interactive-only command without markup*)
fun improper_command name comment kind parse = parser true None name comment kind parse;
wenzelm@6685
   386
wenzelm@6373
   387
wenzelm@5829
   388
end;
wenzelm@5829
   389
wenzelm@6199
   390
(*setup theory syntax dependent operations*)
wenzelm@6199
   391
(*install the dependency scanner defined above into the ThyLoad hook*)
ThyLoad.deps_thy_fn := OuterSyntax.deps_thy;
wenzelm@6199
   392
(*install the theory loader defined above into the ThyLoad hook*)
ThyLoad.load_thy_fn := OuterSyntax.load_thy;
wenzelm@6199
   393
(*re-bind ThyLoad constrained by signature THY_LOAD; presumably this hides the
  *_fn hooks assigned above -- confirm against THY_LOAD*)
structure ThyLoad: THY_LOAD = ThyLoad;
wenzelm@6199
   394
wenzelm@5829
   395
(*restricted view of OuterSyntax that only provides the main / loop entry points*)
structure BasicOuterSyntax: BASIC_OUTER_SYNTAX = OuterSyntax;
wenzelm@5829
   396
(*make main, loop, sync_main, sync_loop available unqualified*)
open BasicOuterSyntax;