src/Pure/Thy/parse.ML
author clasohm
Thu, 16 Sep 1993 12:20:38 +0200
changeset 0 a5a9c433f639
child 213 42f2b8a3581f
permissions -rw-r--r--
Initial revision
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
0
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
     1
(*  Title: 	Pure/Thy/parse
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
     2
    ID:         $Id$
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
     3
    Author: 	Sonia Mahjoub / Tobias Nipkow
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
     4
    Copyright   1992  TU Muenchen
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
     5
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
     6
The parser combinators.
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
     7
Adapted from Larry Paulson's ML for the Working Programmer.
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
     8
*)
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
     9
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    10
(*Global infix declarations for the parsing primitives*)
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    11
infix 5 -- --$$ $$--;
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    12
infix 3 >>;
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    13
infix 0 ||;
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    14
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    15
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    16
signature PARSE = 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    17
sig
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    18
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    19
type token
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    20
val $$     : string -> 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    21
             (token * int) list -> string * (token * int)list 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    22
val id     : (token * int) list -> string * (token * int)list 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    23
val nat    : (token * int) list -> string * (token * int)list 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    24
val stg    : (token * int) list -> string * (token * int)list 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    25
val txt    : (token * int) list -> string * (token * int)list 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    26
val >>     : ('a -> 'b * 'c) * ('b -> 'd) -> 'a -> 'd * 'c
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    27
val ||     : ('a -> 'b) * ('a -> 'b) -> 'a -> 'b 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    28
val --     : ('a -> 'b * 'c) * ('c -> 'd * 'e) -> 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    29
             'a -> ('b * 'd) * 'e
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    30
val $$--   : string * ((token * int)list -> 'b * 'c) -> 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    31
             (token * int) list -> 'b * 'c
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    32
val --$$   : ( 'a -> 'b * (token * int)list ) * string -> 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    33
             'a -> 'b * (token * int)list 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    34
val !!     : ((token * int) list -> 'a * (token * int) list ) 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    35
             -> (token * int) list -> 'a * (token * int) list 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    36
val empty  : 'a -> 'b list * 'a
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    37
val repeat : ('a -> 'b * 'a) -> 'a -> 'b list * 'a
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    38
val repeat1: ('a -> 'b * 'a) -> 'a -> 'b list * 'a
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    39
val list_of: ((token * int)list -> 'b * (token * int)list ) -> 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    40
             (token * int)list  -> 'b list * (token * int)list 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    41
val list_of1: ((token * int)list -> 'b * (token * int)list ) -> 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    42
             (token * int)list  -> 'b list * (token * int)list 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    43
val reader : ((token * int) list -> 'a * ('b * int) list )
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    44
              -> string list -> 'a
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    45
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    46
end;
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    47
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    48
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    49
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    50
functor ParseFUN (Lex: LEXICAL): PARSE =
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    51
struct
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    52
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    53
type token = Lex.token;
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    54
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    55
datatype synerr = Line of string * string * int | EOF of string;
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    56
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    57
exception SynError of synerr;
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    58
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    59
fun synerr(Line(s1, s2, n)) =
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    60
      error("Syntax error on line " ^ (string_of_int n) ^ ": " ^ s1 ^
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    61
            " expected and " ^ s2 ^ " was found")
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    62
  | synerr(EOF(s)) = error("Syntax error on last line: " ^ s ^
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    63
                           " expected and end-of-file was found"); 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    64
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    65
fun string_of_token (Lex.Key b) = b
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    66
  | string_of_token (Lex.Id b)  = b
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    67
  | string_of_token (Lex.Nat b) = b
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    68
  | string_of_token (Lex.Txt b) = b
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    69
  | string_of_token (Lex.Stg b) = b;
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    70
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    71
fun line_err x = raise SynError(Line x);
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    72
fun eof_err s =  raise SynError(EOF s);
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    73
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    74
fun $$a ((Lex.Key b,n) :: toks) =
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    75
           if a = b then (a,toks) else line_err(a,b,n) 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    76
  | $$a ((t,n) :: toks) = line_err (a,string_of_token t, n)
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    77
  | $$a _ = eof_err a;
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    78
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    79
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    80
fun id ((Lex.Id b,n) :: toks) = (b, toks)
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    81
  | id ((t,n) :: toks) = line_err ("identifier", string_of_token t, n)
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    82
  | id _ = eof_err "identifier";
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    83
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    84
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    85
fun nat ((Lex.Nat b,n) :: toks) = (b, toks)
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    86
  | nat ((t,n) :: toks) = 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    87
	line_err ("natural number", string_of_token t, n)
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    88
  | nat _ = eof_err "natural number";
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    89
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    90
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    91
fun stg ((Lex.Stg b,n) :: toks) = (b, toks)
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    92
  | stg ((t,n) :: toks) = line_err("string", string_of_token t, n)
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    93
  | stg _ = eof_err"string";
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    94
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    95
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    96
fun txt ((Lex.Txt b,n) :: toks) = (b, toks)
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    97
  | txt ((t,n) :: toks) = line_err ("ML text", string_of_token t, n)
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    98
  | txt _ = eof_err "ML text";
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
    99
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   100
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   101
fun ( ph >> f) toks = let val (x, toks2) = ph toks in (f x, toks2) end;
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   102
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   103
fun (ph1 || ph2) toks = ph1 toks handle SynError _ => ph2 toks;
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   104
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   105
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   106
fun (ph1 -- ph2) toks =
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   107
    let val (x, toks2) = ph1 toks
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   108
        val (y, toks3) = ph2 toks2
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   109
    in ((x,y), toks3) end;
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   110
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   111
fun (a $$-- ph)  =  $$a -- ph >> #2;
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   112
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   113
fun (ph --$$ a)  =  ph -- $$a >> #1;
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   114
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   115
fun !! ph toks = ph toks handle SynError s => synerr s;
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   116
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   117
fun empty toks = ([], toks);
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   118
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   119
fun repeat ph toks  = (   ph -- repeat ph >> (op::)
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   120
                       || empty ) toks; 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   121
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   122
fun repeat1 ph  =  ph -- repeat ph >> (op::);
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   123
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   124
fun list_of1 ph =  ph -- repeat("," $$-- !! ph) >> (op::);
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   125
fun list_of ph  =  list_of1 ph || empty;
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   126
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   127
fun reader ph a = 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   128
       ( case ph (Lex.scan a) of 
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   129
                (x,  []) => x
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   130
              | (_,(_, n)::_) => error
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   131
                ("Syntax error on line " ^ (string_of_int n) ^ ": " ^
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   132
                 "Extra characters in phrase")
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   133
       );
a5a9c433f639 Initial revision
clasohm
parents:
diff changeset
   134
end;