src/Doc/Implementation/Syntax.thy
author wenzelm
Fri, 20 Jun 2014 20:47:22 +0200
changeset 57346 1d6d44a0583f
parent 57345 8a9639888639
child 57496 94596c573b38
permissions -rw-r--r--
more on syntax phases; tuned;
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
57344
wenzelm
parents: 56420
diff changeset
     1
(*:wrap=hard:maxLineLen=78:*)
wenzelm
parents: 56420
diff changeset
     2
30124
b956bf0dc87c basic setup for chapter "Syntax and type-checking";
wenzelm
parents:
diff changeset
     3
theory Syntax
b956bf0dc87c basic setup for chapter "Syntax and type-checking";
wenzelm
parents:
diff changeset
     4
imports Base
b956bf0dc87c basic setup for chapter "Syntax and type-checking";
wenzelm
parents:
diff changeset
     5
begin
b956bf0dc87c basic setup for chapter "Syntax and type-checking";
wenzelm
parents:
diff changeset
     6
34924
520727474bbe theory data example;
wenzelm
parents: 30272
diff changeset
     7
chapter {* Concrete syntax and type-checking *}
30124
b956bf0dc87c basic setup for chapter "Syntax and type-checking";
wenzelm
parents:
diff changeset
     8
45258
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
     9
text {* Pure @{text "\<lambda>"}-calculus as introduced in \chref{ch:logic} is
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    10
  an adequate foundation for logical languages --- in the tradition of
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    11
  \emph{higher-order abstract syntax} --- but end-users require
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    12
  additional means for reading and printing of terms and types.  This
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    13
  important add-on outside the logical core is called \emph{inner
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    14
  syntax} in Isabelle jargon, as opposed to the \emph{outer syntax} of
46484
50fca9d09528 updated refs;
wenzelm
parents: 45260
diff changeset
    15
  the theory and proof language (cf.\ \cite{isabelle-isar-ref}).
45258
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    16
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    17
  For example, according to \cite{church40} quantifiers are
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    18
  represented as higher-order constants @{text "All :: ('a \<Rightarrow> bool) \<Rightarrow>
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    19
  bool"} such that @{text "All (\<lambda>x::'a. B x)"} faithfully represents
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    20
  the idea that is displayed as @{text "\<forall>x::'a. B x"} via @{keyword
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    21
  "binder"} notation.  Moreover, type-inference in the style of
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    22
  Hindley-Milner \cite{hindleymilner} (and extensions) enables users
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    23
  to write @{text "\<forall>x. B x"} concisely, when the type @{text "'a"} is
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    24
  already clear from the context.\footnote{Type-inference taken to the
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    25
  extreme can easily confuse users, though.  Beginners often stumble
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    26
  over unexpectedly general types inferred by the system.}
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    27
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    28
  \medskip The main inner syntax operations are \emph{read} for
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    29
  parsing together with type-checking, and \emph{pretty} for formatted
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    30
  output.  See also \secref{sec:read-print}.
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    31
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    32
  Furthermore, the input and output syntax layers are sub-divided into
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    33
  separate phases for \emph{concrete syntax} versus \emph{abstract
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    34
  syntax}, see also \secref{sec:parse-unparse} and
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    35
  \secref{sec:term-check}, respectively.  This results in the
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    36
  following decomposition of the main operations:
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    37
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    38
  \begin{itemize}
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    39
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    40
  \item @{text "read = parse; check"}
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    41
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    42
  \item @{text "pretty = uncheck; unparse"}
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    43
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    44
  \end{itemize}
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    45
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    46
  Some specification package might thus intercept syntax processing at
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    47
  a well-defined stage after @{text "parse"}, to augment the
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    48
  resulting pre-term before full type-reconstruction is performed by
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    49
  @{text "check"}, for example.  Note that the formal status of bound
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    50
  variables, versus free variables, versus constants must not be
57345
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    51
  changed between these phases!
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    52
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    53
  \medskip In general, @{text check} and @{text uncheck} operate
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    54
  simultaneously on a list of terms. This is particularly important for
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    55
  type-checking, to reconstruct types for several terms of the same context
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    56
  and scope. In contrast, @{text parse} and @{text unparse} operate separately
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    57
  on single terms.
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    58
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    59
  There are analogous operations to read and print types, with the same
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    60
  sub-division into phases.
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    61
*}
45258
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    62
30272
2d612824e642 regenerated document;
wenzelm
parents: 30270
diff changeset
    63
39876
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
    64
section {* Reading and pretty printing \label{sec:read-print} *}
34924
520727474bbe theory data example;
wenzelm
parents: 30272
diff changeset
    65
45258
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    66
text {* Read and print operations are roughly dual to each other, such
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    67
  that for the user @{text "s' = pretty (read s)"} looks similar to
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    68
  the original source text @{text "s"}, but the details depend on many
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    69
  side-conditions.  There are also explicit options to control
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    70
  suppressing of type information in the output.  The default
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    71
  configuration routinely loses information, so @{text "t' = read
57344
wenzelm
parents: 56420
diff changeset
    72
  (pretty t)"} might fail, or produce a differently typed term, or a
45258
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
    73
  completely different term in the face of syntactic overloading!  *}
34924
520727474bbe theory data example;
wenzelm
parents: 30272
diff changeset
    74
39876
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
    75
text %mlref {*
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
    76
  \begin{mldecls}
57345
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    77
  @{index_ML Syntax.read_typs: "Proof.context -> string list -> typ list"} \\
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    78
  @{index_ML Syntax.read_terms: "Proof.context -> string list -> term list"} \\
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    79
  @{index_ML Syntax.read_props: "Proof.context -> string list -> term list"} \\[0.5ex]
39876
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
    80
  @{index_ML Syntax.read_typ: "Proof.context -> string -> typ"} \\
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
    81
  @{index_ML Syntax.read_term: "Proof.context -> string -> term"} \\
57345
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    82
  @{index_ML Syntax.read_prop: "Proof.context -> string -> term"} \\[0.5ex]
39876
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
    83
  @{index_ML Syntax.pretty_typ: "Proof.context -> typ -> Pretty.T"} \\
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
    84
  @{index_ML Syntax.pretty_term: "Proof.context -> term -> Pretty.T"} \\
57345
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    85
  @{index_ML Syntax.string_of_typ: "Proof.context -> typ -> string"} \\
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    86
  @{index_ML Syntax.string_of_term: "Proof.context -> term -> string"} \\
39876
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
    87
  \end{mldecls}
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
    88
57345
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    89
  \begin{description}
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    90
57346
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
    91
  \item @{ML Syntax.read_typs}~@{text "ctxt strs"} parses and checks a
57345
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    92
  simultaneous list of source strings as types of the logic.
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    93
57346
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
    94
  \item @{ML Syntax.read_terms}~@{text "ctxt strs"} parses and checks a
57345
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    95
  simultaneous list of source strings as terms of the logic.
57346
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
    96
  Type-reconstruction puts all parsed terms into the same scope: types of
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
    97
  free variables ultimately need to coincide.
57345
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    98
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
    99
  If particular type-constraints are required for some of the arguments, the
57346
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   100
  read operation needs to be split into its parse and check phases. Then it
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   101
  is possible to use @{ML Type.constraint} on the intermediate pre-terms.
57345
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   102
57346
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   103
  \item @{ML Syntax.read_props}~@{text "ctxt strs"} parses and checks a
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   104
  simultaneous list of source strings as terms of the logic, with an implicit
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   105
  type-constraint for each argument to enforce type @{typ prop}; this also
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   106
  affects the inner syntax for parsing. The remaining type-reconstruction
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   107
  works as for @{ML Syntax.read_terms} above.
57345
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   108
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   109
  \item @{ML Syntax.read_typ}, @{ML Syntax.read_term}, @{ML Syntax.read_prop}
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   110
  are like the simultaneous versions above, but operate on a single argument
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   111
  only. This convenient shorthand is adequate in situations where a single
57346
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   112
  item in its own scope is processed. Do not use @{ML "map o
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   113
  Syntax.read_term"} where @{ML Syntax.read_terms} is actually intended!
57345
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   114
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   115
  \item @{ML Syntax.pretty_typ}~@{text "ctxt T"} and @{ML
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   116
  Syntax.pretty_term}~@{text "ctxt t"} uncheck and pretty-print the given type
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   117
  or term, respectively. Although the uncheck phase acts on a simultaneous
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   118
  list as well, this is rarely relevant in practice, so only the singleton
57346
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   119
  case is provided as combined pretty operation. There is no distinction of
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   120
  term vs.\ proposition.
57345
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   121
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   122
  \item @{ML Syntax.string_of_typ} and @{ML Syntax.string_of_term} are
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   123
  convenient compositions of @{ML Syntax.pretty_typ} and @{ML
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   124
  Syntax.pretty_term} with @{ML Pretty.string_of} for output. The result may
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   125
  be concatenated with other strings, as long as there is no further
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   126
  formatting and line-breaking involved.
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   127
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   128
  \end{description}
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   129
57346
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   130
  @{ML Syntax.read_term}, @{ML Syntax.read_prop}, and @{ML
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   131
  Syntax.string_of_term} are the most important operations in practice.
57345
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   132
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   133
  \medskip Note that the string values that are passed in and out here are
57346
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   134
  annotated by the system, to carry further markup that is relevant for the
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   135
  Prover IDE \cite{isabelle-jedit}. User code should neither compose its own
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   136
  input strings, nor try to analyze the output strings. Conceptually this is
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   137
  an abstract datatype, encoded into a concrete string for historical reasons.
57345
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   138
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   139
  The standard way to provide the required position markup for input works via
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   140
  the outer syntax parser wrapper @{ML Parse.inner_syntax}, which is already
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   141
  part of @{ML Parse.typ}, @{ML Parse.term}, @{ML Parse.prop}. So a string
8a9639888639 more on syntax phases;
wenzelm
parents: 57344
diff changeset
   142
  obtained from one of the latter may be directly passed to the corresponding
57346
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   143
  read operation: this yields PIDE markup of the input and precise positions
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   144
  for warning and error messages.
39876
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   145
*}
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   146
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   147
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   148
section {* Parsing and unparsing \label{sec:parse-unparse} *}
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   149
45258
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   150
text {* Parsing and unparsing converts between actual source text and
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   151
  a certain \emph{pre-term} format, where all bindings and scopes are
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   152
  resolved faithfully.  Thus the names of free variables or constants
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   153
  are already determined in the sense of the logical context, but type
57344
wenzelm
parents: 56420
diff changeset
   154
  information might be still missing.  Pre-terms support an explicit
45258
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   155
  language of \emph{type constraints} that may be augmented by user
57344
wenzelm
parents: 56420
diff changeset
   156
  code to guide the later \emph{check} phase.
45258
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   157
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   158
  Actual parsing is based on traditional lexical analysis and Earley
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   159
  parsing for arbitrary context-free grammars.  The user can specify
57344
wenzelm
parents: 56420
diff changeset
   160
  the grammar via mixfix annotations.  Moreover, there are \emph{syntax
45258
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   161
  translations} that can be augmented by the user, either
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   162
  declaratively via @{command translations} or programmatically via
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   163
  @{command parse_translation}, @{command print_translation} etc.  The
57346
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   164
  final scope-resolution is performed by the system, according to name
57344
wenzelm
parents: 56420
diff changeset
   165
  spaces for types, term variables and constants etc.\ determined by
wenzelm
parents: 56420
diff changeset
   166
  the context.
45258
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   167
*}
39876
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   168
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   169
text %mlref {*
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   170
  \begin{mldecls}
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   171
  @{index_ML Syntax.parse_typ: "Proof.context -> string -> typ"} \\
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   172
  @{index_ML Syntax.parse_term: "Proof.context -> string -> term"} \\
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   173
  @{index_ML Syntax.parse_prop: "Proof.context -> string -> term"} \\
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   174
  @{index_ML Syntax.unparse_typ: "Proof.context -> typ -> Pretty.T"} \\
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   175
  @{index_ML Syntax.unparse_term: "Proof.context -> term -> Pretty.T"} \\
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   176
  \end{mldecls}
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   177
57346
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   178
  \begin{description}
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   179
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   180
  \item @{ML Syntax.parse_typ}~@{text "ctxt str"} parses a source string as
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   181
  pre-type that is ready to be used with subsequent check operations.
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   182
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   183
  \item @{ML Syntax.parse_term}~@{text "ctxt str"} parses a source string as
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   184
  pre-term that is ready to be used with subsequent check operations.
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   185
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   186
  \item @{ML Syntax.parse_prop}~@{text "ctxt str"} parses a source string as
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   187
  pre-term that is ready to be used with subsequent check operations. The
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   188
  inner syntax category is @{typ prop} and a suitable type-constraint is
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   189
  included to ensure that this information is preserved during the check
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   190
  phase.
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   191
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   192
  \item @{ML Syntax.unparse_typ}~@{text "ctxt T"} unparses a type after
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   193
  uncheck operations, to turn it into a pretty tree.
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   194
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   195
  \item @{ML Syntax.unparse_term}~@{text "ctxt t"} unparses a term after
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   196
  uncheck operations, to turn it into a pretty tree. There is no distinction
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   197
  for propositions here.
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   198
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   199
  \end{description}
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   200
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   201
  These operations always operate on single items; use the combinator @{ML
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   202
  map} to apply them to a list of items.
39876
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   203
*}
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   204
39852
9c977f899ebf tuned chapter arrangement;
wenzelm
parents: 34924
diff changeset
   205
34924
520727474bbe theory data example;
wenzelm
parents: 30272
diff changeset
   206
section {* Checking and unchecking \label{sec:term-check} *}
520727474bbe theory data example;
wenzelm
parents: 30272
diff changeset
   207
45258
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   208
text {* These operations define the transition between pre-terms and
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   209
  fully-annotated terms in the sense of the logical core
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   210
  (\chref{ch:logic}).
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   211
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   212
  The \emph{check} phase is meant to subsume a variety of mechanisms
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   213
  in the manner of ``type-inference'' or ``type-reconstruction'' or
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   214
  ``type-improvement'', not just type-checking in the narrow sense.
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   215
  The \emph{uncheck} phase is roughly dual: it prunes type-information
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   216
  before pretty printing.
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   217
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   218
  A typical add-on for the check/uncheck syntax layer is the @{command
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   219
  abbreviation} mechanism.  Here the user specifies syntactic
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   220
  definitions that are managed by the system as polymorphic @{text
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   221
  "let"} bindings.  These are expanded during the @{text "check"}
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   222
  phase, and contracted during the @{text "uncheck"} phase, without
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   223
  affecting the type-assignment of the given terms.
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   224
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   225
  \medskip The precise meaning of type checking depends on the context
57344
wenzelm
parents: 56420
diff changeset
   226
  --- additional check/uncheck plugins might be defined in user space.
45258
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   227
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   228
  For example, the @{command class} command defines a context where
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   229
  @{text "check"} treats certain type instances of overloaded
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   230
  constants according to the ``dictionary construction'' of its
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   231
  logical foundation.  This involves ``type improvement''
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   232
  (specialization of slightly too general types) and replacement by
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   233
  certain locale parameters.  See also \cite{Haftmann-Wenzel:2009}.
97f8806c3ed6 some text on inner-syntax;
wenzelm
parents: 42510
diff changeset
   234
*}
39852
9c977f899ebf tuned chapter arrangement;
wenzelm
parents: 34924
diff changeset
   235
39876
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   236
text %mlref {*
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   237
  \begin{mldecls}
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   238
  @{index_ML Syntax.check_typs: "Proof.context -> typ list -> typ list"} \\
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   239
  @{index_ML Syntax.check_terms: "Proof.context -> term list -> term list"} \\
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   240
  @{index_ML Syntax.check_props: "Proof.context -> term list -> term list"} \\
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   241
  @{index_ML Syntax.uncheck_typs: "Proof.context -> typ list -> typ list"} \\
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   242
  @{index_ML Syntax.uncheck_terms: "Proof.context -> term list -> term list"} \\
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   243
  \end{mldecls}
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   244
57346
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   245
  \begin{description}
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   246
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   247
  \item @{ML Syntax.check_typs}~@{text "ctxt Ts"} checks a simultaneous list
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   248
  of pre-types as types of the logic.  Typically, this involves normalization
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   249
  of type synonyms.
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   250
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   251
  \item @{ML Syntax.check_terms}~@{text "ctxt ts"} checks a simultaneous list
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   252
  of pre-terms as terms of the logic. Typically, this involves type-inference
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   253
  and normalization of term abbreviations. The types within the given terms are
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   254
  treated in the same way as for @{ML Syntax.check_typs}.
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   255
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   256
  Applications sometimes need to check several types and terms together. The
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   257
  standard approach uses @{ML Logic.mk_type} to embed the language of types
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   258
  into that of terms; all arguments are appended into one list of terms that
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   259
  is checked; afterwards the original type arguments are recovered with @{ML
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   260
  Logic.dest_type}.
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   261
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   262
  \item @{ML Syntax.check_props}~@{text "ctxt ts"} checks a simultaneous list
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   263
  of pre-terms as terms of the logic, such that all terms are constrained by
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   264
  type @{typ prop}. The remaining check operation works as @{ML
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   265
  Syntax.check_terms} above.
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   266
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   267
  \item @{ML Syntax.uncheck_typs}~@{text "ctxt Ts"} unchecks a simultaneous
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   268
  list of types of the logic, in preparation for pretty printing.
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   269
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   270
  \item @{ML Syntax.uncheck_terms}~@{text "ctxt ts"} unchecks a simultaneous
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   271
  list of terms of the logic, in preparation for pretty printing. There is no
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   272
  distinction for propositions here.
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   273
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   274
  \end{description}
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   275
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   276
  These operations always work simultaneously on multiple items; use the
1d6d44a0583f more on syntax phases;
wenzelm
parents: 57345
diff changeset
   277
  combinator @{ML singleton} to apply them to a single item.
39876
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   278
*}
1ff9bce085bd preliminary material on "Concrete syntax and type-checking";
wenzelm
parents: 39865
diff changeset
   279
30124
b956bf0dc87c basic setup for chapter "Syntax and type-checking";
wenzelm
parents:
diff changeset
   280
end