| author | wenzelm | 
| Thu, 20 Feb 2014 20:59:15 +0100 | |
| changeset 55633 | 460f4801b5cb | 
| parent 55112 | b1a5d603fd12 | 
| child 56186 | 01fb1b35433b | 
| permissions | -rw-r--r-- | 
| 28762 | 1  | 
theory Inner_Syntax  | 
| 42651 | 2  | 
imports Base Main  | 
| 28762 | 3  | 
begin  | 
4  | 
||
| 28778 | 5  | 
chapter {* Inner syntax --- the term language \label{ch:inner-syntax} *}
 | 
| 28762 | 6  | 
|
| 46282 | 7  | 
text {* The inner syntax of Isabelle provides concrete notation for
 | 
8  | 
  the main entities of the logical framework, notably @{text
 | 
|
9  | 
"\<lambda>"}-terms with types and type classes. Applications may either  | 
|
10  | 
extend existing syntactic categories by additional notation, or  | 
|
11  | 
define new sub-languages that are linked to the standard term  | 
|
12  | 
  language via some explicit markers.  For example @{verbatim
 | 
|
13  | 
  FOO}~@{text "foo"} could embed the syntax corresponding for some
 | 
|
14  | 
  user-defined nonterminal @{text "foo"} --- within the bounds of the
 | 
|
15  | 
given lexical syntax of Isabelle/Pure.  | 
|
16  | 
||
17  | 
The most basic way to specify concrete syntax for logical entities  | 
|
18  | 
  works via mixfix annotations (\secref{sec:mixfix}), which may be
 | 
|
19  | 
usually given as part of the original declaration or via explicit  | 
|
20  | 
  notation commands later on (\secref{sec:notation}).  This already
 | 
|
21  | 
covers many needs of concrete syntax without having to understand  | 
|
22  | 
the full complexity of inner syntax layers.  | 
|
23  | 
||
24  | 
Further details of the syntax engine involves the classical  | 
|
25  | 
distinction of lexical language versus context-free grammar (see  | 
|
26  | 
  \secref{sec:pure-syntax}), and various mechanisms for \emph{syntax
 | 
|
| 48113 | 27  | 
  transformations} (see \secref{sec:syntax-transformations}).
 | 
| 46282 | 28  | 
*}  | 
29  | 
||
30  | 
||
| 28762 | 31  | 
section {* Printing logical entities *}
 | 
32  | 
||
| 46284 | 33  | 
subsection {* Diagnostic commands \label{sec:print-diag} *}
 | 
| 28762 | 34  | 
|
35  | 
text {*
 | 
|
36  | 
  \begin{matharray}{rcl}
 | 
|
| 
28766
 
accab7594b8e
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28765 
diff
changeset
 | 
37  | 
    @{command_def "typ"}@{text "\<^sup>*"} & : & @{text "context \<rightarrow>"} \\
 | 
| 28762 | 38  | 
    @{command_def "term"}@{text "\<^sup>*"} & : & @{text "context \<rightarrow>"} \\
 | 
39  | 
    @{command_def "prop"}@{text "\<^sup>*"} & : & @{text "context \<rightarrow>"} \\
 | 
|
| 
28766
 
accab7594b8e
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28765 
diff
changeset
 | 
40  | 
    @{command_def "thm"}@{text "\<^sup>*"} & : & @{text "context \<rightarrow>"} \\
 | 
| 28762 | 41  | 
    @{command_def "prf"}@{text "\<^sup>*"} & : & @{text "context \<rightarrow>"} \\
 | 
42  | 
    @{command_def "full_prf"}@{text "\<^sup>*"} & : & @{text "context \<rightarrow>"} \\
 | 
|
| 52430 | 43  | 
    @{command_def "print_state"}@{text "\<^sup>*"} & : & @{text "any \<rightarrow>"} \\
 | 
| 28762 | 44  | 
  \end{matharray}
 | 
45  | 
||
46  | 
These diagnostic commands assist interactive development by printing  | 
|
47  | 
internal logical entities in a human-readable fashion.  | 
|
48  | 
||
| 
55112
 
b1a5d603fd12
prefer rail cartouche -- avoid back-slashed quotes;
 
wenzelm 
parents: 
55108 
diff
changeset
 | 
49  | 
  @{rail \<open>
 | 
| 48792 | 50  | 
    @@{command typ} @{syntax modes}? @{syntax type} ('::' @{syntax sort})?
 | 
| 28762 | 51  | 
;  | 
| 
42596
 
6c621a9d612a
modernized rail diagrams using @{rail} antiquotation;
 
wenzelm 
parents: 
42358 
diff
changeset
 | 
52  | 
    @@{command term} @{syntax modes}? @{syntax term}
 | 
| 28762 | 53  | 
;  | 
| 
42596
 
6c621a9d612a
modernized rail diagrams using @{rail} antiquotation;
 
wenzelm 
parents: 
42358 
diff
changeset
 | 
54  | 
    @@{command prop} @{syntax modes}? @{syntax prop}
 | 
| 28762 | 55  | 
;  | 
| 
42596
 
6c621a9d612a
modernized rail diagrams using @{rail} antiquotation;
 
wenzelm 
parents: 
42358 
diff
changeset
 | 
56  | 
    @@{command thm} @{syntax modes}? @{syntax thmrefs}
 | 
| 28762 | 57  | 
;  | 
| 
42596
 
6c621a9d612a
modernized rail diagrams using @{rail} antiquotation;
 
wenzelm 
parents: 
42358 
diff
changeset
 | 
58  | 
    ( @@{command prf} | @@{command full_prf} ) @{syntax modes}? @{syntax thmrefs}?
 | 
| 28762 | 59  | 
;  | 
| 52430 | 60  | 
    @@{command print_state} @{syntax modes}?
 | 
| 28762 | 61  | 
;  | 
| 
42596
 
6c621a9d612a
modernized rail diagrams using @{rail} antiquotation;
 
wenzelm 
parents: 
42358 
diff
changeset
 | 
62  | 
    @{syntax_def modes}: '(' (@{syntax name} + ) ')'
 | 
| 
55112
 
b1a5d603fd12
prefer rail cartouche -- avoid back-slashed quotes;
 
wenzelm 
parents: 
55108 
diff
changeset
 | 
63  | 
\<close>}  | 
| 28762 | 64  | 
|
65  | 
  \begin{description}
 | 
|
66  | 
||
| 48792 | 67  | 
  \item @{command "typ"}~@{text \<tau>} reads and prints a type expression
 | 
68  | 
according to the current context.  | 
|
69  | 
||
70  | 
  \item @{command "typ"}~@{text "\<tau> :: s"} uses type-inference to
 | 
|
71  | 
  determine the most general way to make @{text "\<tau>"} conform to sort
 | 
|
72  | 
  @{text "s"}.  For concrete @{text "\<tau>"} this checks if the type
 | 
|
73  | 
  belongs to that sort.  Dummy type parameters ``@{text "_"}''
 | 
|
74  | 
(underscore) are assigned to fresh type variables with most general  | 
|
75  | 
sorts, according the the principles of type-inference.  | 
|
| 
28766
 
accab7594b8e
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28765 
diff
changeset
 | 
76  | 
|
| 
 
accab7594b8e
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28765 
diff
changeset
 | 
77  | 
  \item @{command "term"}~@{text t} and @{command "prop"}~@{text \<phi>}
 | 
| 
 
accab7594b8e
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28765 
diff
changeset
 | 
78  | 
read, type-check and print terms or propositions according to the  | 
| 
 
accab7594b8e
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28765 
diff
changeset
 | 
79  | 
  current theory or proof context; the inferred type of @{text t} is
 | 
| 
 
accab7594b8e
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28765 
diff
changeset
 | 
80  | 
output as well. Note that these commands are also useful in  | 
| 
 
accab7594b8e
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28765 
diff
changeset
 | 
81  | 
inspecting the current environment of term abbreviations.  | 
| 28762 | 82  | 
|
83  | 
  \item @{command "thm"}~@{text "a\<^sub>1 \<dots> a\<^sub>n"} retrieves
 | 
|
84  | 
theorems from the current theory or proof context. Note that any  | 
|
85  | 
attributes included in the theorem specifications are applied to a  | 
|
86  | 
temporary context derived from the current theory or proof; the  | 
|
87  | 
  result is discarded, i.e.\ attributes involved in @{text "a\<^sub>1,
 | 
|
88  | 
\<dots>, a\<^sub>n"} do not have any permanent effect.  | 
|
89  | 
||
90  | 
  \item @{command "prf"} displays the (compact) proof term of the
 | 
|
91  | 
current proof state (if present), or of the given theorems. Note  | 
|
92  | 
that this requires proof terms to be switched on for the current  | 
|
93  | 
object logic (see the ``Proof terms'' section of the Isabelle  | 
|
94  | 
reference manual for information on how to do this).  | 
|
95  | 
||
96  | 
  \item @{command "full_prf"} is like @{command "prf"}, but displays
 | 
|
97  | 
the full proof term, i.e.\ also displays information omitted in the  | 
|
98  | 
  compact proof term, which is denoted by ``@{text _}'' placeholders
 | 
|
99  | 
there.  | 
|
100  | 
||
| 52430 | 101  | 
  \item @{command "print_state"} prints the current proof state (if
 | 
102  | 
present), including current facts and goals.  | 
|
| 
28766
 
accab7594b8e
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28765 
diff
changeset
 | 
103  | 
|
| 28762 | 104  | 
  \end{description}
 | 
105  | 
||
106  | 
  All of the diagnostic commands above admit a list of @{text modes}
 | 
|
| 42926 | 107  | 
to be specified, which is appended to the current print mode; see  | 
| 46284 | 108  | 
  also \secref{sec:print-modes}.  Thus the output behavior may be
 | 
109  | 
modified according particular print mode features. For example,  | 
|
| 52430 | 110  | 
  @{command "print_state"}~@{text "(latex xsymbols)"} prints the
 | 
111  | 
current proof state with mathematical symbols and special characters  | 
|
| 46284 | 112  | 
  represented in {\LaTeX} source, according to the Isabelle style
 | 
| 28762 | 113  | 
  \cite{isabelle-sys}.
 | 
114  | 
||
115  | 
  Note that antiquotations (cf.\ \secref{sec:antiq}) provide a more
 | 
|
116  | 
systematic way to include formal items into the printed text  | 
|
117  | 
document.  | 
|
118  | 
*}  | 
|
119  | 
||
120  | 
||
| 
28763
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
121  | 
subsection {* Details of printed content *}
 | 
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
122  | 
|
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
123  | 
text {*
 | 
| 42655 | 124  | 
  \begin{tabular}{rcll}
 | 
| 49699 | 125  | 
    @{attribute_def show_markup} & : & @{text attribute} \\
 | 
| 42655 | 126  | 
    @{attribute_def show_types} & : & @{text attribute} & default @{text false} \\
 | 
127  | 
    @{attribute_def show_sorts} & : & @{text attribute} & default @{text false} \\
 | 
|
128  | 
    @{attribute_def show_consts} & : & @{text attribute} & default @{text false} \\
 | 
|
129  | 
    @{attribute_def show_abbrevs} & : & @{text attribute} & default @{text true} \\
 | 
|
130  | 
    @{attribute_def show_brackets} & : & @{text attribute} & default @{text false} \\
 | 
|
| 
42669
 
04dfffda5671
more conventional naming scheme: names_long, names_short, names_unique;
 
wenzelm 
parents: 
42655 
diff
changeset
 | 
131  | 
    @{attribute_def names_long} & : & @{text attribute} & default @{text false} \\
 | 
| 
 
04dfffda5671
more conventional naming scheme: names_long, names_short, names_unique;
 
wenzelm 
parents: 
42655 
diff
changeset
 | 
132  | 
    @{attribute_def names_short} & : & @{text attribute} & default @{text false} \\
 | 
| 
 
04dfffda5671
more conventional naming scheme: names_long, names_short, names_unique;
 
wenzelm 
parents: 
42655 
diff
changeset
 | 
133  | 
    @{attribute_def names_unique} & : & @{text attribute} & default @{text true} \\
 | 
| 42655 | 134  | 
    @{attribute_def eta_contract} & : & @{text attribute} & default @{text true} \\
 | 
135  | 
    @{attribute_def goals_limit} & : & @{text attribute} & default @{text 10} \\
 | 
|
136  | 
    @{attribute_def show_main_goal} & : & @{text attribute} & default @{text false} \\
 | 
|
137  | 
    @{attribute_def show_hyps} & : & @{text attribute} & default @{text false} \\
 | 
|
138  | 
    @{attribute_def show_tags} & : & @{text attribute} & default @{text false} \\
 | 
|
139  | 
    @{attribute_def show_question_marks} & : & @{text attribute} & default @{text true} \\
 | 
|
140  | 
  \end{tabular}
 | 
|
141  | 
\medskip  | 
|
| 
28763
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
142  | 
|
| 42655 | 143  | 
These configuration options control the detail of information that  | 
144  | 
is displayed for types, terms, theorems, goals etc. See also  | 
|
145  | 
  \secref{sec:config}.
 | 
|
| 
28765
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
146  | 
|
| 
28763
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
147  | 
  \begin{description}
 | 
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
148  | 
|
| 49699 | 149  | 
  \item @{attribute show_markup} controls direct inlining of markup
 | 
150  | 
into the printed representation of formal entities --- notably type  | 
|
151  | 
and sort constraints. This enables Prover IDE users to retrieve  | 
|
152  | 
that information via tooltips or popups while hovering with the  | 
|
153  | 
mouse over the output window, for example. Consequently, this  | 
|
154  | 
option is enabled by default for Isabelle/jEdit, but disabled for  | 
|
155  | 
TTY and Proof~General~/Emacs where document markup would not work.  | 
|
156  | 
||
| 42655 | 157  | 
  \item @{attribute show_types} and @{attribute show_sorts} control
 | 
158  | 
printing of type constraints for term variables, and sort  | 
|
159  | 
constraints for type variables. By default, neither of these are  | 
|
160  | 
  shown in output.  If @{attribute show_sorts} is enabled, types are
 | 
|
| 49699 | 161  | 
always shown as well. In Isabelle/jEdit, manual setting of these  | 
162  | 
  options is normally not required thanks to @{attribute show_markup}
 | 
|
163  | 
above.  | 
|
| 
28763
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
164  | 
|
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
165  | 
Note that displaying types and sorts may explain why a polymorphic  | 
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
166  | 
inference rule fails to resolve with some goal, or why a rewrite  | 
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
167  | 
rule does not apply as expected.  | 
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
168  | 
|
| 42655 | 169  | 
  \item @{attribute show_consts} controls printing of types of
 | 
170  | 
constants when displaying a goal state.  | 
|
| 
28765
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
171  | 
|
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
172  | 
Note that the output can be enormous, because polymorphic constants  | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
173  | 
often occur at several different type instances.  | 
| 
28763
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
174  | 
|
| 42655 | 175  | 
  \item @{attribute show_abbrevs} controls folding of constant
 | 
176  | 
abbreviations.  | 
|
| 
40879
 
ca132ef44944
configuration option "show_abbrevs" supersedes print mode "no_abbrevs", with inverted meaning;
 
wenzelm 
parents: 
40255 
diff
changeset
 | 
177  | 
|
| 42655 | 178  | 
  \item @{attribute show_brackets} controls bracketing in pretty
 | 
179  | 
printed output. If enabled, all sub-expressions of the pretty  | 
|
| 
28765
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
180  | 
printing tree will be parenthesized, even if this produces malformed  | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
181  | 
term syntax! This crude way of showing the internal structure of  | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
182  | 
pretty printed entities may occasionally help to diagnose problems  | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
183  | 
with operator priorities, for example.  | 
| 
28763
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
184  | 
|
| 
42669
 
04dfffda5671
more conventional naming scheme: names_long, names_short, names_unique;
 
wenzelm 
parents: 
42655 
diff
changeset
 | 
185  | 
  \item @{attribute names_long}, @{attribute names_short}, and
 | 
| 
 
04dfffda5671
more conventional naming scheme: names_long, names_short, names_unique;
 
wenzelm 
parents: 
42655 
diff
changeset
 | 
186  | 
  @{attribute names_unique} control the way of printing fully
 | 
| 
42358
 
b47d41d9f4b5
Name_Space: proper configuration options long_names, short_names, unique_names instead of former unsynchronized references;
 
wenzelm 
parents: 
42279 
diff
changeset
 | 
187  | 
qualified internal names in external form. See also  | 
| 
 
b47d41d9f4b5
Name_Space: proper configuration options long_names, short_names, unique_names instead of former unsynchronized references;
 
wenzelm 
parents: 
42279 
diff
changeset
 | 
188  | 
  \secref{sec:antiq} for the document antiquotation options of the
 | 
| 
 
b47d41d9f4b5
Name_Space: proper configuration options long_names, short_names, unique_names instead of former unsynchronized references;
 
wenzelm 
parents: 
42279 
diff
changeset
 | 
189  | 
same names.  | 
| 
 
b47d41d9f4b5
Name_Space: proper configuration options long_names, short_names, unique_names instead of former unsynchronized references;
 
wenzelm 
parents: 
42279 
diff
changeset
 | 
190  | 
|
| 42655 | 191  | 
  \item @{attribute eta_contract} controls @{text "\<eta>"}-contracted
 | 
192  | 
printing of terms.  | 
|
| 
28763
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
193  | 
|
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
194  | 
  The @{text \<eta>}-contraction law asserts @{prop "(\<lambda>x. f x) \<equiv> f"},
 | 
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
195  | 
  provided @{text x} is not free in @{text f}.  It asserts
 | 
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
196  | 
  \emph{extensionality} of functions: @{prop "f \<equiv> g"} if @{prop "f x \<equiv>
 | 
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
197  | 
  g x"} for all @{text x}.  Higher-order unification frequently puts
 | 
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
198  | 
  terms into a fully @{text \<eta>}-expanded form.  For example, if @{text
 | 
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
199  | 
  F} has type @{text "(\<tau> \<Rightarrow> \<tau>) \<Rightarrow> \<tau>"} then its expanded form is @{term
 | 
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
200  | 
"\<lambda>h. F (\<lambda>x. h x)"}.  | 
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
201  | 
|
| 42655 | 202  | 
  Enabling @{attribute eta_contract} makes Isabelle perform @{text
 | 
| 
28763
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
203  | 
  \<eta>}-contractions before printing, so that @{term "\<lambda>h. F (\<lambda>x. h x)"}
 | 
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
204  | 
  appears simply as @{text F}.
 | 
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
205  | 
|
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
206  | 
  Note that the distinction between a term and its @{text \<eta>}-expanded
 | 
| 
28765
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
207  | 
form occasionally matters. While higher-order resolution and  | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
208  | 
  rewriting operate modulo @{text "\<alpha>\<beta>\<eta>"}-conversion, some other tools
 | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
209  | 
might look at terms more discretely.  | 
| 
28763
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
210  | 
|
| 42655 | 211  | 
  \item @{attribute goals_limit} controls the maximum number of
 | 
| 
51960
 
61ac1efe02c3
option "goals_limit", with more uniform description;
 
wenzelm 
parents: 
51657 
diff
changeset
 | 
212  | 
subgoals to be printed.  | 
| 
28763
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
213  | 
|
| 42655 | 214  | 
  \item @{attribute show_main_goal} controls whether the main result
 | 
215  | 
to be proven should be displayed. This information might be  | 
|
| 39130 | 216  | 
relevant for schematic goals, to inspect the current claim that has  | 
217  | 
been synthesized so far.  | 
|
| 
28763
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
218  | 
|
| 42655 | 219  | 
  \item @{attribute show_hyps} controls printing of implicit
 | 
220  | 
hypotheses of local facts. Normally, only those hypotheses are  | 
|
221  | 
  displayed that are \emph{not} covered by the assumptions of the
 | 
|
222  | 
current context: this situation indicates a fault in some tool being  | 
|
223  | 
used.  | 
|
| 
28763
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
224  | 
|
| 42655 | 225  | 
  By enabling @{attribute show_hyps}, output of \emph{all} hypotheses
 | 
226  | 
can be enforced, which is occasionally useful for diagnostic  | 
|
227  | 
purposes.  | 
|
| 
28763
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
228  | 
|
| 42655 | 229  | 
  \item @{attribute show_tags} controls printing of extra annotations
 | 
230  | 
within theorems, such as internal position information, or the case  | 
|
231  | 
  names being attached by the attribute @{attribute case_names}.
 | 
|
| 
28765
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
232  | 
|
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
233  | 
  Note that the @{attribute tagged} and @{attribute untagged}
 | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
234  | 
attributes provide low-level access to the collection of tags  | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
235  | 
associated with a theorem.  | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
236  | 
|
| 42655 | 237  | 
  \item @{attribute show_question_marks} controls printing of question
 | 
238  | 
  marks for schematic variables, such as @{text ?x}.  Only the leading
 | 
|
| 
28765
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
239  | 
question mark is affected, the remaining text is unchanged  | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
240  | 
(including proper markup for schematic variables that might be  | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
241  | 
relevant for user interfaces).  | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
242  | 
|
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
243  | 
  \end{description}
 | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
244  | 
*}  | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
245  | 
|
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
246  | 
|
| 46284 | 247  | 
subsection {* Alternative print modes \label{sec:print-modes} *}
 | 
248  | 
||
249  | 
text {*
 | 
|
250  | 
  \begin{mldecls}
 | 
|
251  | 
    @{index_ML print_mode_value: "unit -> string list"} \\
 | 
|
252  | 
    @{index_ML Print_Mode.with_modes: "string list -> ('a -> 'b) -> 'a -> 'b"} \\
 | 
|
253  | 
  \end{mldecls}
 | 
|
254  | 
||
255  | 
  The \emph{print mode} facility allows to modify various operations
 | 
|
256  | 
  for printing.  Commands like @{command typ}, @{command term},
 | 
|
257  | 
  @{command thm} (see \secref{sec:print-diag}) take additional print
 | 
|
258  | 
modes as optional argument. The underlying ML operations are as  | 
|
259  | 
follows.  | 
|
260  | 
||
261  | 
  \begin{description}
 | 
|
262  | 
||
263  | 
  \item @{ML "print_mode_value ()"} yields the list of currently
 | 
|
264  | 
active print mode names. This should be understood as symbolic  | 
|
265  | 
representation of certain individual features for printing (with  | 
|
266  | 
precedence from left to right).  | 
|
267  | 
||
268  | 
  \item @{ML Print_Mode.with_modes}~@{text "modes f x"} evaluates
 | 
|
269  | 
  @{text "f x"} in an execution context where the print mode is
 | 
|
270  | 
  prepended by the given @{text "modes"}.  This provides a thread-safe
 | 
|
271  | 
way to augment print modes. It is also monotonic in the set of mode  | 
|
272  | 
names: it retains the default print mode that certain  | 
|
273  | 
user-interfaces might have installed for their proper functioning!  | 
|
274  | 
||
275  | 
  \end{description}
 | 
|
276  | 
||
277  | 
  \begin{warn}
 | 
|
278  | 
  The old global reference @{ML print_mode} should never be used
 | 
|
279  | 
directly in applications. Its main reason for being publicly  | 
|
280  | 
accessible is to support historic versions of Proof~General.  | 
|
281  | 
  \end{warn}
 | 
|
282  | 
||
283  | 
\medskip The pretty printer for inner syntax maintains alternative  | 
|
284  | 
mixfix productions for any print mode name invented by the user, say  | 
|
285  | 
  in commands like @{command notation} or @{command abbreviation}.
 | 
|
286  | 
Mode names can be arbitrary, but the following ones have a specific  | 
|
287  | 
meaning by convention:  | 
|
288  | 
||
289  | 
  \begin{itemize}
 | 
|
290  | 
||
291  | 
  \item @{verbatim "\"\""} (the empty string): default mode;
 | 
|
292  | 
implicitly active as last element in the list of modes.  | 
|
293  | 
||
294  | 
  \item @{verbatim input}: dummy print mode that is never active; may
 | 
|
295  | 
be used to specify notation that is only available for input.  | 
|
296  | 
||
297  | 
  \item @{verbatim internal} dummy print mode that is never active;
 | 
|
298  | 
used internally in Isabelle/Pure.  | 
|
299  | 
||
300  | 
  \item @{verbatim xsymbols}: enable proper mathematical symbols
 | 
|
301  | 
  instead of ASCII art.\footnote{This traditional mode name stems from
 | 
|
302  | 
the ``X-Symbol'' package for old versions Proof~General with XEmacs,  | 
|
303  | 
although that package has been superseded by Unicode in recent  | 
|
304  | 
years.}  | 
|
305  | 
||
306  | 
  \item @{verbatim HTML}: additional mode that is active in HTML
 | 
|
307  | 
presentation of Isabelle theory sources; allows to provide  | 
|
308  | 
alternative output notation.  | 
|
309  | 
||
310  | 
  \item @{verbatim latex}: additional mode that is active in {\LaTeX}
 | 
|
311  | 
document preparation of Isabelle theory sources; allows to provide  | 
|
312  | 
alternative output notation.  | 
|
313  | 
||
314  | 
  \end{itemize}
 | 
|
315  | 
*}  | 
|
316  | 
||
317  | 
||
| 
28765
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
318  | 
subsection {* Printing limits *}
 | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
319  | 
|
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
320  | 
text {*
 | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
321  | 
  \begin{mldecls}
 | 
| 36745 | 322  | 
    @{index_ML Pretty.margin_default: "int Unsynchronized.ref"} \\
 | 
| 
28765
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
323  | 
    @{index_ML print_depth: "int -> unit"} \\
 | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
324  | 
  \end{mldecls}
 | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
325  | 
|
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
326  | 
These ML functions set limits for pretty printed text.  | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
327  | 
|
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
328  | 
  \begin{description}
 | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
329  | 
|
| 36745 | 330  | 
  \item @{ML Pretty.margin_default} indicates the global default for
 | 
331  | 
the right margin of the built-in pretty printer, with initial value  | 
|
332  | 
76. Note that user-interfaces typically control margins  | 
|
333  | 
automatically when resizing windows, or even bypass the formatting  | 
|
334  | 
engine of Isabelle/ML altogether and do it within the front end via  | 
|
335  | 
Isabelle/Scala.  | 
|
| 
28765
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
336  | 
|
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
337  | 
  \item @{ML print_depth}~@{text n} limits the printing depth of the
 | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
338  | 
ML toplevel pretty printer; the precise effect depends on the ML  | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
339  | 
  compiler and run-time system.  Typically @{text n} should be less
 | 
| 
 
da8f6f4a74be
misc tuning and rearrangement of section "Printing logical entities";
 
wenzelm 
parents: 
28763 
diff
changeset
 | 
340  | 
than 10. Bigger values such as 100--1000 are useful for debugging.  | 
| 
28763
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
341  | 
|
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
342  | 
  \end{description}
 | 
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
343  | 
*}  | 
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
344  | 
|
| 
 
b5e6122ff575
added pretty printing options (from old ref manual);
 
wenzelm 
parents: 
28762 
diff
changeset
 | 
345  | 
|
| 46282 | 346  | 
section {* Mixfix annotations \label{sec:mixfix} *}
 | 
| 28762 | 347  | 
|
348  | 
text {* Mixfix annotations specify concrete \emph{inner syntax} of
 | 
|
| 
35351
 
7425aece4ee3
allow general mixfix syntax for type constructors;
 
wenzelm 
parents: 
32833 
diff
changeset
 | 
349  | 
Isabelle types and terms. Locally fixed parameters in toplevel  | 
| 46290 | 350  | 
theorem statements, locale and class specifications also admit  | 
351  | 
mixfix annotations in a fairly uniform manner. A mixfix annotation  | 
|
| 50635 | 352  | 
describes the concrete syntax, the translation to abstract  | 
| 46290 | 353  | 
syntax, and the pretty printing. Special case annotations provide a  | 
354  | 
simple means of specifying infix operators and binders.  | 
|
355  | 
||
356  | 
  Isabelle mixfix syntax is inspired by {\OBJ} \cite{OBJ}.  It allows
 | 
|
357  | 
to specify any context-free priority grammar, which is more general  | 
|
358  | 
than the fixity declarations of ML and Prolog.  | 
|
| 28762 | 359  | 
|
| 
55112
 
b1a5d603fd12
prefer rail cartouche -- avoid back-slashed quotes;
 
wenzelm 
parents: 
55108 
diff
changeset
 | 
360  | 
  @{rail \<open>
 | 
| 
51654
 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 
wenzelm 
parents: 
50636 
diff
changeset
 | 
361  | 
    @{syntax_def mixfix}: '('
 | 
| 
 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 
wenzelm 
parents: 
50636 
diff
changeset
 | 
362  | 
      @{syntax template} prios? @{syntax nat}? |
 | 
| 46290 | 363  | 
      (@'infix' | @'infixl' | @'infixr') @{syntax template} @{syntax nat} |
 | 
| 
51654
 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 
wenzelm 
parents: 
50636 
diff
changeset
 | 
364  | 
      @'binder' @{syntax template} prios? @{syntax nat} |
 | 
| 
 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 
wenzelm 
parents: 
50636 
diff
changeset
 | 
365  | 
@'structure'  | 
| 
 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 
wenzelm 
parents: 
50636 
diff
changeset
 | 
366  | 
')'  | 
| 46290 | 367  | 
;  | 
368  | 
template: string  | 
|
| 46289 | 369  | 
;  | 
| 
42596
 
6c621a9d612a
modernized rail diagrams using @{rail} antiquotation;
 
wenzelm 
parents: 
42358 
diff
changeset
 | 
370  | 
    prios: '[' (@{syntax nat} + ',') ']'
 | 
| 
55112
 
b1a5d603fd12
prefer rail cartouche -- avoid back-slashed quotes;
 
wenzelm 
parents: 
55108 
diff
changeset
 | 
371  | 
\<close>}  | 
| 28762 | 372  | 
|
| 46290 | 373  | 
  The string given as @{text template} may include literal text,
 | 
374  | 
  spacing, blocks, and arguments (denoted by ``@{text _}''); the
 | 
|
375  | 
  special symbol ``@{verbatim "\<index>"}'' (printed as ``@{text "\<index>"}'')
 | 
|
| 
51657
 
3db1bbc82d8d
more accurate documentation of "(structure)" mixfix;
 
wenzelm 
parents: 
51654 
diff
changeset
 | 
376  | 
  represents an index argument that specifies an implicit @{keyword
 | 
| 
 
3db1bbc82d8d
more accurate documentation of "(structure)" mixfix;
 
wenzelm 
parents: 
51654 
diff
changeset
 | 
377  | 
  "structure"} reference (see also \secref{sec:locale}).  Only locally
 | 
| 
 
3db1bbc82d8d
more accurate documentation of "(structure)" mixfix;
 
wenzelm 
parents: 
51654 
diff
changeset
 | 
378  | 
  fixed variables may be declared as @{keyword "structure"}.
 | 
| 
 
3db1bbc82d8d
more accurate documentation of "(structure)" mixfix;
 
wenzelm 
parents: 
51654 
diff
changeset
 | 
379  | 
|
| 
 
3db1bbc82d8d
more accurate documentation of "(structure)" mixfix;
 
wenzelm 
parents: 
51654 
diff
changeset
 | 
380  | 
Infix and binder declarations provide common abbreviations for  | 
| 
 
3db1bbc82d8d
more accurate documentation of "(structure)" mixfix;
 
wenzelm 
parents: 
51654 
diff
changeset
 | 
381  | 
particular mixfix declarations. So in practice, mixfix templates  | 
| 
 
3db1bbc82d8d
more accurate documentation of "(structure)" mixfix;
 
wenzelm 
parents: 
51654 
diff
changeset
 | 
382  | 
mostly degenerate to literal text for concrete syntax, such as  | 
| 
 
3db1bbc82d8d
more accurate documentation of "(structure)" mixfix;
 
wenzelm 
parents: 
51654 
diff
changeset
 | 
383  | 
  ``@{verbatim "++"}'' for an infix symbol.  *}
 | 
| 28762 | 384  | 
|
| 46290 | 385  | 
|
386  | 
subsection {* The general mixfix form *}
 | 
|
387  | 
||
388  | 
text {* In full generality, mixfix declarations work as follows.
 | 
|
389  | 
  Suppose a constant @{text "c :: \<tau>\<^sub>1 \<Rightarrow> \<dots> \<tau>\<^sub>n \<Rightarrow> \<tau>"} is annotated by
 | 
|
390  | 
  @{text "(mixfix [p\<^sub>1, \<dots>, p\<^sub>n] p)"}, where @{text "mixfix"} is a string
 | 
|
391  | 
  @{text "d\<^sub>0 _ d\<^sub>1 _ \<dots> _ d\<^sub>n"} consisting of delimiters that surround
 | 
|
392  | 
argument positions as indicated by underscores.  | 
|
| 28762 | 393  | 
|
394  | 
Altogether this determines a production for a context-free priority  | 
|
395  | 
  grammar, where for each argument @{text "i"} the syntactic category
 | 
|
| 46292 | 396  | 
  is determined by @{text "\<tau>\<^sub>i"} (with priority @{text "p\<^sub>i"}), and the
 | 
397  | 
  result category is determined from @{text "\<tau>"} (with priority @{text
 | 
|
398  | 
"p"}). Priority specifications are optional, with default 0 for  | 
|
399  | 
  arguments and 1000 for the result.\footnote{Omitting priorities is
 | 
|
400  | 
prone to syntactic ambiguities unless the delimiter tokens determine  | 
|
401  | 
  fully bracketed notation, as in @{text "if _ then _ else _ fi"}.}
 | 
|
| 28762 | 402  | 
|
403  | 
  Since @{text "\<tau>"} may be again a function type, the constant
 | 
|
404  | 
type scheme may have more argument positions than the mixfix  | 
|
405  | 
  pattern.  Printing a nested application @{text "c t\<^sub>1 \<dots> t\<^sub>m"} for
 | 
|
406  | 
  @{text "m > n"} works by attaching concrete notation only to the
 | 
|
407  | 
  innermost part, essentially by printing @{text "(c t\<^sub>1 \<dots> t\<^sub>n) \<dots> t\<^sub>m"}
 | 
|
408  | 
instead. If a term has fewer arguments than specified in the mixfix  | 
|
409  | 
template, the concrete syntax is ignored.  | 
|
410  | 
||
411  | 
\medskip A mixfix template may also contain additional directives  | 
|
412  | 
for pretty printing, notably spaces, blocks, and breaks. The  | 
|
413  | 
general template format is a sequence over any of the following  | 
|
414  | 
entities.  | 
|
415  | 
||
| 28778 | 416  | 
  \begin{description}
 | 
| 28762 | 417  | 
|
| 
28771
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
418  | 
  \item @{text "d"} is a delimiter, namely a non-empty sequence of
 | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
419  | 
characters other than the following special characters:  | 
| 28762 | 420  | 
|
| 
28771
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
421  | 
\smallskip  | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
422  | 
  \begin{tabular}{ll}
 | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
423  | 
    @{verbatim "'"} & single quote \\
 | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
424  | 
    @{verbatim "_"} & underscore \\
 | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
425  | 
    @{text "\<index>"} & index symbol \\
 | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
426  | 
    @{verbatim "("} & open parenthesis \\
 | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
427  | 
    @{verbatim ")"} & close parenthesis \\
 | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
428  | 
    @{verbatim "/"} & slash \\
 | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
429  | 
  \end{tabular}
 | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
430  | 
\medskip  | 
| 28762 | 431  | 
|
| 
28771
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
432  | 
  \item @{verbatim "'"} escapes the special meaning of these
 | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
433  | 
meta-characters, producing a literal version of the following  | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
434  | 
character, unless that is a blank.  | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
435  | 
|
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
436  | 
A single quote followed by a blank separates delimiters, without  | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
437  | 
affecting printing, but input tokens may have additional white space  | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
438  | 
here.  | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
439  | 
|
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
440  | 
  \item @{verbatim "_"} is an argument position, which stands for a
 | 
| 28762 | 441  | 
certain syntactic category in the underlying grammar.  | 
442  | 
||
| 
28771
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
443  | 
  \item @{text "\<index>"} is an indexed argument position; this is the place
 | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
444  | 
where implicit structure arguments can be attached.  | 
| 28762 | 445  | 
|
| 
28771
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
446  | 
  \item @{text "s"} is a non-empty sequence of spaces for printing.
 | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
447  | 
This and the following specifications do not affect parsing at all.  | 
| 28762 | 448  | 
|
| 
28771
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
449  | 
  \item @{verbatim "("}@{text n} opens a pretty printing block.  The
 | 
| 28762 | 450  | 
optional number specifies how much indentation to add when a line  | 
451  | 
break occurs within the block. If the parenthesis is not followed  | 
|
452  | 
by digits, the indentation defaults to 0. A block specified via  | 
|
| 
28771
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
453  | 
  @{verbatim "(00"} is unbreakable.
 | 
| 28762 | 454  | 
|
| 
28771
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
455  | 
  \item @{verbatim ")"} closes a pretty printing block.
 | 
| 28762 | 456  | 
|
| 
28771
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
457  | 
  \item @{verbatim "//"} forces a line break.
 | 
| 28762 | 458  | 
|
| 
28771
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
459  | 
  \item @{verbatim "/"}@{text s} allows a line break.  Here @{text s}
 | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
460  | 
stands for the string of spaces (zero or more) right after the  | 
| 
 
4510201c6aaf
mixfix annotations: verbatim for special symbols;
 
wenzelm 
parents: 
28770 
diff
changeset
 | 
461  | 
  slash.  These spaces are printed if the break is \emph{not} taken.
 | 
| 28762 | 462  | 
|
| 28778 | 463  | 
  \end{description}
 | 
| 28762 | 464  | 
|
465  | 
The general idea of pretty printing with blocks and breaks is also  | 
|
| 46286 | 466  | 
  described in \cite{paulson-ml2}; it goes back to \cite{Oppen:1980}.
 | 
| 28762 | 467  | 
*}  | 
468  | 
||
469  | 
||
| 46290 | 470  | 
subsection {* Infixes *}
 | 
471  | 
||
472  | 
text {* Infix operators are specified by convenient short forms that
 | 
|
473  | 
abbreviate general mixfix annotations as follows:  | 
|
474  | 
||
475  | 
  \begin{center}
 | 
|
476  | 
  \begin{tabular}{lll}
 | 
|
477  | 
||
| 46292 | 478  | 
  @{verbatim "("}@{keyword_def "infix"}~@{verbatim "\""}@{text sy}@{verbatim "\""} @{text "p"}@{verbatim ")"}
 | 
| 46290 | 479  | 
  & @{text "\<mapsto>"} &
 | 
480  | 
  @{verbatim "(\"(_ "}@{text sy}@{verbatim "/ _)\" ["}@{text "p + 1"}@{verbatim ", "}@{text "p + 1"}@{verbatim "]"}@{text " p"}@{verbatim ")"} \\
 | 
|
| 46292 | 481  | 
  @{verbatim "("}@{keyword_def "infixl"}~@{verbatim "\""}@{text sy}@{verbatim "\""} @{text "p"}@{verbatim ")"}
 | 
| 46290 | 482  | 
  & @{text "\<mapsto>"} &
 | 
483  | 
  @{verbatim "(\"(_ "}@{text sy}@{verbatim "/ _)\" ["}@{text "p"}@{verbatim ", "}@{text "p + 1"}@{verbatim "]"}@{text " p"}@{verbatim ")"} \\
 | 
|
| 46292 | 484  | 
  @{verbatim "("}@{keyword_def "infixr"}~@{verbatim "\""}@{text sy}@{verbatim "\""} @{text "p"}@{verbatim ")"}
 | 
| 46290 | 485  | 
  & @{text "\<mapsto>"} &
 | 
486  | 
  @{verbatim "(\"(_ "}@{text sy}@{verbatim "/ _)\" ["}@{text "p + 1"}@{verbatim ", "}@{text "p"}@{verbatim "]"}@{text " p"}@{verbatim ")"} \\
 | 
|
487  | 
||
488  | 
  \end{tabular}
 | 
|
489  | 
  \end{center}
 | 
|
490  | 
||
| 46292 | 491  | 
  The mixfix template @{verbatim "\"(_ "}@{text sy}@{verbatim "/ _)\""}
 | 
492  | 
specifies two argument positions; the delimiter is preceded by a  | 
|
493  | 
space and followed by a space or line break; the entire phrase is a  | 
|
494  | 
pretty printing block.  | 
|
| 46290 | 495  | 
|
496  | 
  The alternative notation @{verbatim "op"}~@{text sy} is introduced
 | 
|
497  | 
in addition. Thus any infix operator may be written in prefix form  | 
|
498  | 
(as in ML), independently of the number of arguments in the term.  | 
|
499  | 
*}  | 
|
500  | 
||
501  | 
||
502  | 
subsection {* Binders *}
 | 
|
503  | 
||
504  | 
text {* A \emph{binder} is a variable-binding construct such as a
 | 
|
505  | 
  quantifier.  The idea to formalize @{text "\<forall>x. b"} as @{text "All
 | 
|
506  | 
  (\<lambda>x. b)"} for @{text "All :: ('a \<Rightarrow> bool) \<Rightarrow> bool"} already goes back
 | 
|
507  | 
  to \cite{church40}.  Isabelle declarations of certain higher-order
 | 
|
| 46292 | 508  | 
  operators may be annotated with @{keyword_def "binder"} annotations
 | 
509  | 
as follows:  | 
|
| 46290 | 510  | 
|
511  | 
  \begin{center}
 | 
|
512  | 
  @{text "c :: "}@{verbatim "\""}@{text "(\<tau>\<^sub>1 \<Rightarrow> \<tau>\<^sub>2) \<Rightarrow> \<tau>\<^sub>3"}@{verbatim "\"  ("}@{keyword "binder"}@{verbatim " \""}@{text "sy"}@{verbatim "\" ["}@{text "p"}@{verbatim "] "}@{text "q"}@{verbatim ")"}
 | 
|
513  | 
  \end{center}
 | 
|
514  | 
||
515  | 
  This introduces concrete binder syntax @{text "sy x. b"}, where
 | 
|
516  | 
  @{text x} is a bound variable of type @{text "\<tau>\<^sub>1"}, the body @{text
 | 
|
517  | 
  b} has type @{text "\<tau>\<^sub>2"} and the whole term has type @{text "\<tau>\<^sub>3"}.
 | 
|
518  | 
  The optional integer @{text p} specifies the syntactic priority of
 | 
|
519  | 
  the body; the default is @{text "q"}, which is also the priority of
 | 
|
520  | 
the whole construct.  | 
|
521  | 
||
522  | 
Internally, the binder syntax is expanded to something like this:  | 
|
523  | 
  \begin{center}
 | 
|
524  | 
  @{text "c_binder :: "}@{verbatim "\""}@{text "idts \<Rightarrow> \<tau>\<^sub>2 \<Rightarrow> \<tau>\<^sub>3"}@{verbatim "\"  (\"(3"}@{text sy}@{verbatim "_./ _)\" [0, "}@{text "p"}@{verbatim "] "}@{text "q"}@{verbatim ")"}
 | 
|
525  | 
  \end{center}
 | 
|
526  | 
||
527  | 
  Here @{syntax (inner) idts} is the nonterminal symbol for a list of
 | 
|
528  | 
identifiers with optional type constraints (see also  | 
|
529  | 
  \secref{sec:pure-grammar}).  The mixfix template @{verbatim
 | 
|
530  | 
  "\"(3"}@{text sy}@{verbatim "_./ _)\""} defines argument positions
 | 
|
531  | 
for the bound identifiers and the body, separated by a dot with  | 
|
532  | 
optional line break; the entire phrase is a pretty printing block of  | 
|
533  | 
  indentation level 3.  Note that there is no extra space after @{text
 | 
|
534  | 
"sy"}, so it needs to be included user specification if the binder  | 
|
535  | 
syntax ends with a token that may be continued by an identifier  | 
|
536  | 
  token at the start of @{syntax (inner) idts}.
 | 
|
537  | 
||
538  | 
  Furthermore, a syntax translation to transforms @{text "c_binder x\<^sub>1
 | 
|
539  | 
  \<dots> x\<^sub>n b"} into iterated application @{text "c (\<lambda>x\<^sub>1. \<dots> c (\<lambda>x\<^sub>n. b)\<dots>)"}.
 | 
|
540  | 
This works in both directions, for parsing and printing. *}  | 
|
541  | 
||
542  | 
||
| 46282 | 543  | 
section {* Explicit notation \label{sec:notation} *}
 | 
| 28762 | 544  | 
|
545  | 
text {*
 | 
|
546  | 
  \begin{matharray}{rcll}
 | 
|
| 35413 | 547  | 
    @{command_def "type_notation"} & : & @{text "local_theory \<rightarrow> local_theory"} \\
 | 
548  | 
    @{command_def "no_type_notation"} & : & @{text "local_theory \<rightarrow> local_theory"} \\
 | 
|
| 28762 | 549  | 
    @{command_def "notation"} & : & @{text "local_theory \<rightarrow> local_theory"} \\
 | 
550  | 
    @{command_def "no_notation"} & : & @{text "local_theory \<rightarrow> local_theory"} \\
 | 
|
| 
36508
 
03d2a2d0ee4a
allow concrete syntax for local entities within a proof body, either via regular mixfix annotations to 'fix' etc. or the separate 'write' command;
 
wenzelm 
parents: 
35413 
diff
changeset
 | 
551  | 
    @{command_def "write"} & : & @{text "proof(state) \<rightarrow> proof(state)"} \\
 | 
| 28762 | 552  | 
  \end{matharray}
 | 
553  | 
||
| 46288 | 554  | 
Commands that introduce new logical entities (terms or types)  | 
555  | 
usually allow to provide mixfix annotations on the spot, which is  | 
|
556  | 
convenient for default notation. Nonetheless, the syntax may be  | 
|
557  | 
modified later on by declarations for explicit notation. This  | 
|
558  | 
allows to add or delete mixfix annotations for of existing logical  | 
|
559  | 
entities within the current context.  | 
|
560  | 
||
| 
55112
 
b1a5d603fd12
prefer rail cartouche -- avoid back-slashed quotes;
 
wenzelm 
parents: 
55108 
diff
changeset
 | 
561  | 
  @{rail \<open>
 | 
| 
42596
 
6c621a9d612a
modernized rail diagrams using @{rail} antiquotation;
 
wenzelm 
parents: 
42358 
diff
changeset
 | 
562  | 
    (@@{command type_notation} | @@{command no_type_notation}) @{syntax target}?
 | 
| 
55029
 
61a6bf7d4b02
clarified @{rail} syntax: prefer explicit \<newline> symbol;
 
wenzelm 
parents: 
52430 
diff
changeset
 | 
563  | 
      @{syntax mode}? \<newline> (@{syntax nameref} @{syntax mixfix} + @'and')
 | 
| 35413 | 564  | 
;  | 
| 
55029
 
61a6bf7d4b02
clarified @{rail} syntax: prefer explicit \<newline> symbol;
 
wenzelm 
parents: 
52430 
diff
changeset
 | 
565  | 
    (@@{command notation} | @@{command no_notation}) @{syntax target}? @{syntax mode}? \<newline>
 | 
| 
51654
 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 
wenzelm 
parents: 
50636 
diff
changeset
 | 
566  | 
      (@{syntax nameref} @{syntax mixfix} + @'and')
 | 
| 28762 | 567  | 
;  | 
| 
51654
 
8450b944e58a
just one syntax category "mixfix" -- check structure annotation semantically;
 
wenzelm 
parents: 
50636 
diff
changeset
 | 
568  | 
    @@{command write} @{syntax mode}? (@{syntax nameref} @{syntax mixfix} + @'and')
 | 
| 
55112
 
b1a5d603fd12
prefer rail cartouche -- avoid back-slashed quotes;
 
wenzelm 
parents: 
55108 
diff
changeset
 | 
569  | 
\<close>}  | 
| 28762 | 570  | 
|
571  | 
  \begin{description}
 | 
|
572  | 
||
| 35413 | 573  | 
  \item @{command "type_notation"}~@{text "c (mx)"} associates mixfix
 | 
574  | 
syntax with an existing type constructor. The arity of the  | 
|
575  | 
constructor is retrieved from the context.  | 
|
| 46282 | 576  | 
|
| 35413 | 577  | 
  \item @{command "no_type_notation"} is similar to @{command
 | 
578  | 
"type_notation"}, but removes the specified syntax annotation from  | 
|
579  | 
the present context.  | 
|
580  | 
||
| 28762 | 581  | 
  \item @{command "notation"}~@{text "c (mx)"} associates mixfix
 | 
| 35413 | 582  | 
syntax with an existing constant or fixed variable. The type  | 
583  | 
declaration of the given entity is retrieved from the context.  | 
|
| 46282 | 584  | 
|
| 28762 | 585  | 
  \item @{command "no_notation"} is similar to @{command "notation"},
 | 
586  | 
but removes the specified syntax annotation from the present  | 
|
587  | 
context.  | 
|
588  | 
||
| 
36508
 
03d2a2d0ee4a
allow concrete syntax for local entities within a proof body, either via regular mixfix annotations to 'fix' etc. or the separate 'write' command;
 
wenzelm 
parents: 
35413 
diff
changeset
 | 
589  | 
  \item @{command "write"} is similar to @{command "notation"}, but
 | 
| 
 
03d2a2d0ee4a
allow concrete syntax for local entities within a proof body, either via regular mixfix annotations to 'fix' etc. or the separate 'write' command;
 
wenzelm 
parents: 
35413 
diff
changeset
 | 
590  | 
works within an Isar proof body.  | 
| 
 
03d2a2d0ee4a
allow concrete syntax for local entities within a proof body, either via regular mixfix annotations to 'fix' etc. or the separate 'write' command;
 
wenzelm 
parents: 
35413 
diff
changeset
 | 
591  | 
|
| 28762 | 592  | 
  \end{description}
 | 
593  | 
*}  | 
|
594  | 
||
| 28778 | 595  | 
|
596  | 
section {* The Pure syntax \label{sec:pure-syntax} *}
 | 
|
| 
28769
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
597  | 
|
| 46282 | 598  | 
subsection {* Lexical matters \label{sec:inner-lex} *}
 | 
599  | 
||
600  | 
text {* The inner lexical syntax vaguely resembles the outer one
 | 
|
601  | 
  (\secref{sec:outer-lex}), but some details are different.  There are
 | 
|
602  | 
two main categories of inner syntax tokens:  | 
|
603  | 
||
604  | 
  \begin{enumerate}
 | 
|
605  | 
||
606  | 
  \item \emph{delimiters} --- the literal tokens occurring in
 | 
|
607  | 
productions of the given priority grammar (cf.\  | 
|
608  | 
  \secref{sec:priority-grammar});
 | 
|
609  | 
||
610  | 
  \item \emph{named tokens} --- various categories of identifiers etc.
 | 
|
611  | 
||
612  | 
  \end{enumerate}
 | 
|
613  | 
||
614  | 
Delimiters override named tokens and may thus render certain  | 
|
615  | 
identifiers inaccessible. Sometimes the logical context admits  | 
|
616  | 
alternative ways to refer to the same entity, potentially via  | 
|
617  | 
qualified names.  | 
|
618  | 
||
619  | 
\medskip The categories for named tokens are defined once and for  | 
|
620  | 
all as follows, reusing some categories of the outer token syntax  | 
|
621  | 
  (\secref{sec:outer-lex}).
 | 
|
622  | 
||
623  | 
  \begin{center}
 | 
|
624  | 
  \begin{supertabular}{rcl}
 | 
|
625  | 
    @{syntax_def (inner) id} & = & @{syntax_ref ident} \\
 | 
|
626  | 
    @{syntax_def (inner) longid} & = & @{syntax_ref longident} \\
 | 
|
627  | 
    @{syntax_def (inner) var} & = & @{syntax_ref var} \\
 | 
|
628  | 
    @{syntax_def (inner) tid} & = & @{syntax_ref typefree} \\
 | 
|
629  | 
    @{syntax_def (inner) tvar} & = & @{syntax_ref typevar} \\
 | 
|
630  | 
    @{syntax_def (inner) num_token} & = & @{syntax_ref nat}@{text "  |  "}@{verbatim "-"}@{syntax_ref nat} \\
 | 
|
631  | 
    @{syntax_def (inner) float_token} & = & @{syntax_ref nat}@{verbatim "."}@{syntax_ref nat}@{text "  |  "}@{verbatim "-"}@{syntax_ref nat}@{verbatim "."}@{syntax_ref nat} \\
 | 
|
632  | 
    @{syntax_def (inner) xnum_token} & = & @{verbatim "#"}@{syntax_ref nat}@{text "  |  "}@{verbatim "#-"}@{syntax_ref nat} \\
 | 
|
| 46483 | 633  | 
    @{syntax_def (inner) str_token} & = & @{verbatim "''"} @{text "\<dots>"} @{verbatim "''"} \\
 | 
| 
55108
 
0b7a0c1fdf7e
inner syntax token language allows regular quoted strings;
 
wenzelm 
parents: 
55033 
diff
changeset
 | 
634  | 
    @{syntax_def (inner) string_token} & = & @{verbatim "\""} @{text "\<dots>"} @{verbatim "\""} \\
 | 
| 55033 | 635  | 
    @{syntax_def (inner) cartouche} & = & @{verbatim "\<open>"} @{text "\<dots>"} @{verbatim "\<close>"} \\
 | 
| 46282 | 636  | 
  \end{supertabular}
 | 
637  | 
  \end{center}
 | 
|
638  | 
||
639  | 
  The token categories @{syntax (inner) num_token}, @{syntax (inner)
 | 
|
| 55033 | 640  | 
  float_token}, @{syntax (inner) xnum_token}, @{syntax (inner)
 | 
| 
55108
 
0b7a0c1fdf7e
inner syntax token language allows regular quoted strings;
 
wenzelm 
parents: 
55033 
diff
changeset
 | 
641  | 
  str_token}, @{syntax (inner) string_token}, and @{syntax (inner)
 | 
| 
 
0b7a0c1fdf7e
inner syntax token language allows regular quoted strings;
 
wenzelm 
parents: 
55033 
diff
changeset
 | 
642  | 
cartouche} are not used in Pure. Object-logics may implement  | 
| 
 
0b7a0c1fdf7e
inner syntax token language allows regular quoted strings;
 
wenzelm 
parents: 
55033 
diff
changeset
 | 
643  | 
numerals and string literals by adding appropriate syntax  | 
| 
 
0b7a0c1fdf7e
inner syntax token language allows regular quoted strings;
 
wenzelm 
parents: 
55033 
diff
changeset
 | 
644  | 
declarations, together with some translation functions (e.g.\ see  | 
| 
 
0b7a0c1fdf7e
inner syntax token language allows regular quoted strings;
 
wenzelm 
parents: 
55033 
diff
changeset
 | 
645  | 
  @{file "~~/src/HOL/Tools/string_syntax.ML"}).
 | 
| 46282 | 646  | 
|
647  | 
  The derived categories @{syntax_def (inner) num_const}, @{syntax_def
 | 
|
648  | 
  (inner) float_const}, and @{syntax_def (inner) num_const} provide
 | 
|
649  | 
robust access to the respective tokens: the syntax tree holds a  | 
|
650  | 
syntactic constant instead of a free variable.  | 
|
651  | 
*}  | 
|
652  | 
||
653  | 
||
| 28777 | 654  | 
subsection {* Priority grammars \label{sec:priority-grammar} *}
 | 
| 
28769
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
655  | 
|
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
656  | 
text {* A context-free grammar consists of a set of \emph{terminal
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
657  | 
  symbols}, a set of \emph{nonterminal symbols} and a set of
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
658  | 
  \emph{productions}.  Productions have the form @{text "A = \<gamma>"},
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
659  | 
  where @{text A} is a nonterminal and @{text \<gamma>} is a string of
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
660  | 
terminals and nonterminals. One designated nonterminal is called  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
661  | 
  the \emph{root symbol}.  The language defined by the grammar
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
662  | 
consists of all strings of terminals that can be derived from the  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
663  | 
root symbol by applying productions as rewrite rules.  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
664  | 
|
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
665  | 
  The standard Isabelle parser for inner syntax uses a \emph{priority
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
666  | 
grammar}. Each nonterminal is decorated by an integer priority:  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
667  | 
  @{text "A\<^sup>(\<^sup>p\<^sup>)"}.  In a derivation, @{text "A\<^sup>(\<^sup>p\<^sup>)"} may be rewritten
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
668  | 
  using a production @{text "A\<^sup>(\<^sup>q\<^sup>) = \<gamma>"} only if @{text "p \<le> q"}.  Any
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
669  | 
priority grammar can be translated into a normal context-free  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
670  | 
grammar by introducing new nonterminals and productions.  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
671  | 
|
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
672  | 
  \medskip Formally, a set of context free productions @{text G}
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
673  | 
  induces a derivation relation @{text "\<longrightarrow>\<^sub>G"} as follows.  Let @{text
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
674  | 
  \<alpha>} and @{text \<beta>} denote strings of terminal or nonterminal symbols.
 | 
| 28774 | 675  | 
  Then @{text "\<alpha> A\<^sup>(\<^sup>p\<^sup>) \<beta> \<longrightarrow>\<^sub>G \<alpha> \<gamma> \<beta>"} holds if and only if @{text G}
 | 
676  | 
  contains some production @{text "A\<^sup>(\<^sup>q\<^sup>) = \<gamma>"} for @{text "p \<le> q"}.
 | 
|
| 
28769
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
677  | 
|
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
678  | 
\medskip The following grammar for arithmetic expressions  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
679  | 
demonstrates how binding power and associativity of operators can be  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
680  | 
enforced by priorities.  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
681  | 
|
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
682  | 
  \begin{center}
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
683  | 
  \begin{tabular}{rclr}
 | 
| 28774 | 684  | 
  @{text "A\<^sup>(\<^sup>1\<^sup>0\<^sup>0\<^sup>0\<^sup>)"} & @{text "="} & @{verbatim "("} @{text "A\<^sup>(\<^sup>0\<^sup>)"} @{verbatim ")"} \\
 | 
| 
28769
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
685  | 
  @{text "A\<^sup>(\<^sup>1\<^sup>0\<^sup>0\<^sup>0\<^sup>)"} & @{text "="} & @{verbatim 0} \\
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
686  | 
  @{text "A\<^sup>(\<^sup>0\<^sup>)"} & @{text "="} & @{text "A\<^sup>(\<^sup>0\<^sup>)"} @{verbatim "+"} @{text "A\<^sup>(\<^sup>1\<^sup>)"} \\
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
687  | 
  @{text "A\<^sup>(\<^sup>2\<^sup>)"} & @{text "="} & @{text "A\<^sup>(\<^sup>3\<^sup>)"} @{verbatim "*"} @{text "A\<^sup>(\<^sup>2\<^sup>)"} \\
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
688  | 
  @{text "A\<^sup>(\<^sup>3\<^sup>)"} & @{text "="} & @{verbatim "-"} @{text "A\<^sup>(\<^sup>3\<^sup>)"} \\
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
689  | 
  \end{tabular}
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
690  | 
  \end{center}
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
691  | 
  The choice of priorities determines that @{verbatim "-"} binds
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
692  | 
  tighter than @{verbatim "*"}, which binds tighter than @{verbatim
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
693  | 
  "+"}.  Furthermore @{verbatim "+"} associates to the left and
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
694  | 
  @{verbatim "*"} to the right.
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
695  | 
|
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
696  | 
\medskip For clarity, grammars obey these conventions:  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
697  | 
  \begin{itemize}
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
698  | 
|
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
699  | 
\item All priorities must lie between 0 and 1000.  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
700  | 
|
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
701  | 
\item Priority 0 on the right-hand side and priority 1000 on the  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
702  | 
left-hand side may be omitted.  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
703  | 
|
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
704  | 
  \item The production @{text "A\<^sup>(\<^sup>p\<^sup>) = \<alpha>"} is written as @{text "A = \<alpha>
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
705  | 
(p)"}, i.e.\ the priority of the left-hand side actually appears in  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
706  | 
a column on the far right.  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
707  | 
|
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
708  | 
  \item Alternatives are separated by @{text "|"}.
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
709  | 
|
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
710  | 
  \item Repetition is indicated by dots @{text "(\<dots>)"} in an informal
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
711  | 
but obvious way.  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
712  | 
|
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
713  | 
  \end{itemize}
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
714  | 
|
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
715  | 
Using these conventions, the example grammar specification above  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
716  | 
takes the form:  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
717  | 
  \begin{center}
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
718  | 
  \begin{tabular}{rclc}
 | 
| 28774 | 719  | 
    @{text A} & @{text "="} & @{verbatim "("} @{text A} @{verbatim ")"} \\
 | 
720  | 
              & @{text "|"} & @{verbatim 0} & \qquad\qquad \\
 | 
|
| 
28769
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
721  | 
              & @{text "|"} & @{text A} @{verbatim "+"} @{text "A\<^sup>(\<^sup>1\<^sup>)"} & @{text "(0)"} \\
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
722  | 
              & @{text "|"} & @{text "A\<^sup>(\<^sup>3\<^sup>)"} @{verbatim "*"} @{text "A\<^sup>(\<^sup>2\<^sup>)"} & @{text "(2)"} \\
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
723  | 
              & @{text "|"} & @{verbatim "-"} @{text "A\<^sup>(\<^sup>3\<^sup>)"} & @{text "(3)"} \\
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
724  | 
  \end{tabular}
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
725  | 
  \end{center}
 | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
726  | 
*}  | 
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
727  | 
|
| 
 
8fc228f21861
added section "Priority grammars" (variant from old ref manual);
 
wenzelm 
parents: 
28767 
diff
changeset
 | 
728  | 
|
| 46290 | 729  | 
subsection {* The Pure grammar \label{sec:pure-grammar} *}
 | 
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
730  | 
|
| 46287 | 731  | 
text {* The priority grammar of the @{text "Pure"} theory is defined
 | 
732  | 
approximately like this:  | 
|
| 28774 | 733  | 
|
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
734  | 
  \begin{center}
 | 
| 28773 | 735  | 
  \begin{supertabular}{rclr}
 | 
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
736  | 
|
| 28778 | 737  | 
  @{syntax_def (inner) any} & = & @{text "prop  |  logic"} \\\\
 | 
| 28772 | 738  | 
|
| 28778 | 739  | 
  @{syntax_def (inner) prop} & = & @{verbatim "("} @{text prop} @{verbatim ")"} \\
 | 
| 28772 | 740  | 
    & @{text "|"} & @{text "prop\<^sup>(\<^sup>4\<^sup>)"} @{verbatim "::"} @{text type} & @{text "(3)"} \\
 | 
| 
50636
 
07f47142378e
uniform notation for == and \<equiv> (cf. 3e3c2af5e8a5);
 
wenzelm 
parents: 
50635 
diff
changeset
 | 
741  | 
    & @{text "|"} & @{text "any\<^sup>(\<^sup>3\<^sup>)"} @{verbatim "=="} @{text "any\<^sup>(\<^sup>3\<^sup>)"} & @{text "(2)"} \\
 | 
| 
 
07f47142378e
uniform notation for == and \<equiv> (cf. 3e3c2af5e8a5);
 
wenzelm 
parents: 
50635 
diff
changeset
 | 
742  | 
    & @{text "|"} & @{text "any\<^sup>(\<^sup>3\<^sup>)"} @{text "\<equiv>"} @{text "any\<^sup>(\<^sup>3\<^sup>)"} & @{text "(2)"} \\
 | 
| 
28856
 
5e009a80fe6d
Pure syntax: more coherent treatment of aprop, permanent TERM and &&&;
 
wenzelm 
parents: 
28779 
diff
changeset
 | 
743  | 
    & @{text "|"} & @{text "prop\<^sup>(\<^sup>3\<^sup>)"} @{verbatim "&&&"} @{text "prop\<^sup>(\<^sup>2\<^sup>)"} & @{text "(2)"} \\
 | 
| 28772 | 744  | 
    & @{text "|"} & @{text "prop\<^sup>(\<^sup>2\<^sup>)"} @{verbatim "==>"} @{text "prop\<^sup>(\<^sup>1\<^sup>)"} & @{text "(1)"} \\
 | 
| 28773 | 745  | 
    & @{text "|"} & @{text "prop\<^sup>(\<^sup>2\<^sup>)"} @{text "\<Longrightarrow>"} @{text "prop\<^sup>(\<^sup>1\<^sup>)"} & @{text "(1)"} \\
 | 
| 28772 | 746  | 
    & @{text "|"} & @{verbatim "[|"} @{text prop} @{verbatim ";"} @{text "\<dots>"} @{verbatim ";"} @{text prop} @{verbatim "|]"} @{verbatim "==>"} @{text "prop\<^sup>(\<^sup>1\<^sup>)"} & @{text "(1)"} \\
 | 
| 28773 | 747  | 
    & @{text "|"} & @{text "\<lbrakk>"} @{text prop} @{verbatim ";"} @{text "\<dots>"} @{verbatim ";"} @{text prop} @{text "\<rbrakk>"} @{text "\<Longrightarrow>"} @{text "prop\<^sup>(\<^sup>1\<^sup>)"} & @{text "(1)"} \\
 | 
| 28772 | 748  | 
    & @{text "|"} & @{verbatim "!!"} @{text idts} @{verbatim "."} @{text prop} & @{text "(0)"} \\
 | 
| 28773 | 749  | 
    & @{text "|"} & @{text "\<And>"} @{text idts} @{verbatim "."} @{text prop} & @{text "(0)"} \\
 | 
750  | 
    & @{text "|"} & @{verbatim OFCLASS} @{verbatim "("} @{text type} @{verbatim ","} @{text logic} @{verbatim ")"} \\
 | 
|
751  | 
    & @{text "|"} & @{verbatim SORT_CONSTRAINT} @{verbatim "("} @{text type} @{verbatim ")"} \\
 | 
|
| 
28856
 
5e009a80fe6d
Pure syntax: more coherent treatment of aprop, permanent TERM and &&&;
 
wenzelm 
parents: 
28779 
diff
changeset
 | 
752  | 
    & @{text "|"} & @{verbatim TERM} @{text logic} \\
 | 
| 28773 | 753  | 
    & @{text "|"} & @{verbatim PROP} @{text aprop} \\\\
 | 
| 28772 | 754  | 
|
| 
28856
 
5e009a80fe6d
Pure syntax: more coherent treatment of aprop, permanent TERM and &&&;
 
wenzelm 
parents: 
28779 
diff
changeset
 | 
755  | 
  @{syntax_def (inner) aprop} & = & @{verbatim "("} @{text aprop} @{verbatim ")"} \\
 | 
| 
 
5e009a80fe6d
Pure syntax: more coherent treatment of aprop, permanent TERM and &&&;
 
wenzelm 
parents: 
28779 
diff
changeset
 | 
756  | 
    & @{text "|"} & @{text "id  |  longid  |  var  |  "}@{verbatim "_"}@{text "  |  "}@{verbatim "..."} \\
 | 
| 
 
5e009a80fe6d
Pure syntax: more coherent treatment of aprop, permanent TERM and &&&;
 
wenzelm 
parents: 
28779 
diff
changeset
 | 
757  | 
    & @{text "|"} & @{verbatim CONST} @{text "id  |  "}@{verbatim CONST} @{text "longid"} \\
 | 
| 46287 | 758  | 
    & @{text "|"} & @{verbatim XCONST} @{text "id  |  "}@{verbatim XCONST} @{text "longid"} \\
 | 
| 28773 | 759  | 
    & @{text "|"} & @{text "logic\<^sup>(\<^sup>1\<^sup>0\<^sup>0\<^sup>0\<^sup>)  any\<^sup>(\<^sup>1\<^sup>0\<^sup>0\<^sup>0\<^sup>) \<dots> any\<^sup>(\<^sup>1\<^sup>0\<^sup>0\<^sup>0\<^sup>)"} & @{text "(999)"} \\\\
 | 
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
760  | 
|
| 28778 | 761  | 
  @{syntax_def (inner) logic} & = & @{verbatim "("} @{text logic} @{verbatim ")"} \\
 | 
| 28772 | 762  | 
    & @{text "|"} & @{text "logic\<^sup>(\<^sup>4\<^sup>)"} @{verbatim "::"} @{text type} & @{text "(3)"} \\
 | 
| 28773 | 763  | 
    & @{text "|"} & @{text "id  |  longid  |  var  |  "}@{verbatim "_"}@{text "  |  "}@{verbatim "..."} \\
 | 
| 
28856
 
5e009a80fe6d
Pure syntax: more coherent treatment of aprop, permanent TERM and &&&;
 
wenzelm 
parents: 
28779 
diff
changeset
 | 
764  | 
    & @{text "|"} & @{verbatim CONST} @{text "id  |  "}@{verbatim CONST} @{text "longid"} \\
 | 
| 46287 | 765  | 
    & @{text "|"} & @{verbatim XCONST} @{text "id  |  "}@{verbatim XCONST} @{text "longid"} \\
 | 
| 28773 | 766  | 
    & @{text "|"} & @{text "logic\<^sup>(\<^sup>1\<^sup>0\<^sup>0\<^sup>0\<^sup>)  any\<^sup>(\<^sup>1\<^sup>0\<^sup>0\<^sup>0\<^sup>) \<dots> any\<^sup>(\<^sup>1\<^sup>0\<^sup>0\<^sup>0\<^sup>)"} & @{text "(999)"} \\
 | 
| 46287 | 767  | 
    & @{text "|"} & @{text "\<struct> index\<^sup>(\<^sup>1\<^sup>0\<^sup>0\<^sup>0\<^sup>)"} \\
 | 
| 28772 | 768  | 
    & @{text "|"} & @{verbatim "%"} @{text pttrns} @{verbatim "."} @{text "any\<^sup>(\<^sup>3\<^sup>)"} & @{text "(3)"} \\
 | 
| 28773 | 769  | 
    & @{text "|"} & @{text \<lambda>} @{text pttrns} @{verbatim "."} @{text "any\<^sup>(\<^sup>3\<^sup>)"} & @{text "(3)"} \\
 | 
| 46287 | 770  | 
    & @{text "|"} & @{verbatim op} @{verbatim "=="}@{text "  |  "}@{verbatim op} @{text "\<equiv>"}@{text "  |  "}@{verbatim op} @{verbatim "&&&"} \\
 | 
771  | 
    & @{text "|"} & @{verbatim op} @{verbatim "==>"}@{text "  |  "}@{verbatim op} @{text "\<Longrightarrow>"} \\
 | 
|
| 28772 | 772  | 
    & @{text "|"} & @{verbatim TYPE} @{verbatim "("} @{text type} @{verbatim ")"} \\\\
 | 
773  | 
||
| 28778 | 774  | 
  @{syntax_def (inner) idt} & = & @{verbatim "("} @{text idt} @{verbatim ")"}@{text "  |  id  |  "}@{verbatim "_"} \\
 | 
| 28773 | 775  | 
    & @{text "|"} & @{text id} @{verbatim "::"} @{text type} & @{text "(0)"} \\
 | 
776  | 
    & @{text "|"} & @{verbatim "_"} @{verbatim "::"} @{text type} & @{text "(0)"} \\\\
 | 
|
| 28772 | 777  | 
|
| 46287 | 778  | 
  @{syntax_def (inner) index} & = & @{verbatim "\<^bsub>"} @{text "logic\<^sup>(\<^sup>0\<^sup>)"} @{verbatim "\<^esub>"}@{text "  |  |  \<index>"} \\\\
 | 
779  | 
||
| 28778 | 780  | 
  @{syntax_def (inner) idts} & = & @{text "idt  |  idt\<^sup>(\<^sup>1\<^sup>) idts"} & @{text "(0)"} \\\\
 | 
| 28772 | 781  | 
|
| 28778 | 782  | 
  @{syntax_def (inner) pttrn} & = & @{text idt} \\\\
 | 
| 28772 | 783  | 
|
| 28778 | 784  | 
  @{syntax_def (inner) pttrns} & = & @{text "pttrn  |  pttrn\<^sup>(\<^sup>1\<^sup>) pttrns"} & @{text "(0)"} \\\\
 | 
| 28774 | 785  | 
|
| 28778 | 786  | 
  @{syntax_def (inner) type} & = & @{verbatim "("} @{text type} @{verbatim ")"} \\
 | 
| 28773 | 787  | 
    & @{text "|"} & @{text "tid  |  tvar  |  "}@{verbatim "_"} \\
 | 
788  | 
    & @{text "|"} & @{text "tid"} @{verbatim "::"} @{text "sort  |  tvar  "}@{verbatim "::"} @{text "sort  |  "}@{verbatim "_"} @{verbatim "::"} @{text "sort"} \\
 | 
|
| 46287 | 789  | 
    & @{text "|"} & @{text "type_name  |  type\<^sup>(\<^sup>1\<^sup>0\<^sup>0\<^sup>0\<^sup>) type_name"} \\
 | 
790  | 
    & @{text "|"} & @{verbatim "("} @{text type} @{verbatim ","} @{text "\<dots>"} @{verbatim ","} @{text type} @{verbatim ")"} @{text type_name} \\
 | 
|
| 28772 | 791  | 
    & @{text "|"} & @{text "type\<^sup>(\<^sup>1\<^sup>)"} @{verbatim "=>"} @{text type} & @{text "(0)"} \\
 | 
| 28773 | 792  | 
    & @{text "|"} & @{text "type\<^sup>(\<^sup>1\<^sup>)"} @{text "\<Rightarrow>"} @{text type} & @{text "(0)"} \\
 | 
793  | 
    & @{text "|"} & @{verbatim "["} @{text type} @{verbatim ","} @{text "\<dots>"} @{verbatim ","} @{text type} @{verbatim "]"} @{verbatim "=>"} @{text type} & @{text "(0)"} \\
 | 
|
| 46287 | 794  | 
    & @{text "|"} & @{verbatim "["} @{text type} @{verbatim ","} @{text "\<dots>"} @{verbatim ","} @{text type} @{verbatim "]"} @{text "\<Rightarrow>"} @{text type} & @{text "(0)"} \\
 | 
795  | 
  @{syntax_def (inner) type_name} & = & @{text "id  |  longid"} \\\\
 | 
|
| 28772 | 796  | 
|
| 46287 | 797  | 
  @{syntax_def (inner) sort} & = & @{syntax class_name}~@{text "  |  "}@{verbatim "{}"} \\
 | 
798  | 
    & @{text "|"} & @{verbatim "{"} @{syntax class_name} @{verbatim ","} @{text "\<dots>"} @{verbatim ","} @{syntax class_name} @{verbatim "}"} \\
 | 
|
799  | 
  @{syntax_def (inner) class_name} & = & @{text "id  |  longid"} \\
 | 
|
| 28773 | 800  | 
  \end{supertabular}
 | 
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
801  | 
  \end{center}
 | 
| 
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
802  | 
|
| 28774 | 803  | 
  \medskip Here literal terminals are printed @{verbatim "verbatim"};
 | 
804  | 
  see also \secref{sec:inner-lex} for further token categories of the
 | 
|
805  | 
inner syntax. The meaning of the nonterminals defined by the above  | 
|
806  | 
grammar is as follows:  | 
|
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
807  | 
|
| 
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
808  | 
  \begin{description}
 | 
| 
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
809  | 
|
| 28778 | 810  | 
  \item @{syntax_ref (inner) any} denotes any term.
 | 
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
811  | 
|
| 28778 | 812  | 
  \item @{syntax_ref (inner) prop} denotes meta-level propositions,
 | 
813  | 
  which are terms of type @{typ prop}.  The syntax of such formulae of
 | 
|
814  | 
the meta-logic is carefully distinguished from usual conventions for  | 
|
815  | 
  object-logics.  In particular, plain @{text "\<lambda>"}-term notation is
 | 
|
816  | 
  \emph{not} recognized as @{syntax (inner) prop}.
 | 
|
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
817  | 
|
| 28778 | 818  | 
  \item @{syntax_ref (inner) aprop} denotes atomic propositions, which
 | 
819  | 
  are embedded into regular @{syntax (inner) prop} by means of an
 | 
|
820  | 
  explicit @{verbatim PROP} token.
 | 
|
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
821  | 
|
| 
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
822  | 
  Terms of type @{typ prop} with non-constant head, e.g.\ a plain
 | 
| 
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
823  | 
  variable, are printed in this form.  Constants that yield type @{typ
 | 
| 
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
824  | 
prop} are expected to provide their own concrete syntax; otherwise  | 
| 28778 | 825  | 
  the printed version will appear like @{syntax (inner) logic} and
 | 
826  | 
  cannot be parsed again as @{syntax (inner) prop}.
 | 
|
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
827  | 
|
| 28778 | 828  | 
  \item @{syntax_ref (inner) logic} denotes arbitrary terms of a
 | 
829  | 
  logical type, excluding type @{typ prop}.  This is the main
 | 
|
830  | 
  syntactic category of object-logic entities, covering plain @{text
 | 
|
831  | 
\<lambda>}-term notation (variables, abstraction, application), plus  | 
|
832  | 
anything defined by the user.  | 
|
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
833  | 
|
| 
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
834  | 
When specifying notation for logical entities, all logical types  | 
| 
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
835  | 
  (excluding @{typ prop}) are \emph{collapsed} to this single category
 | 
| 28778 | 836  | 
  of @{syntax (inner) logic}.
 | 
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
837  | 
|
| 46287 | 838  | 
  \item @{syntax_ref (inner) index} denotes an optional index term for
 | 
| 
51657
 
3db1bbc82d8d
more accurate documentation of "(structure)" mixfix;
 
wenzelm 
parents: 
51654 
diff
changeset
 | 
839  | 
  indexed syntax.  If omitted, it refers to the first @{keyword_ref
 | 
| 46287 | 840  | 
  "structure"} variable in the context.  The special dummy ``@{text
 | 
841  | 
"\<index>"}'' serves as pattern variable in mixfix annotations that  | 
|
842  | 
introduce indexed notation.  | 
|
843  | 
||
| 28778 | 844  | 
  \item @{syntax_ref (inner) idt} denotes identifiers, possibly
 | 
845  | 
constrained by types.  | 
|
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
846  | 
|
| 28778 | 847  | 
  \item @{syntax_ref (inner) idts} denotes a sequence of @{syntax_ref
 | 
848  | 
(inner) idt}. This is the most basic category for variables in  | 
|
849  | 
  iterated binders, such as @{text "\<lambda>"} or @{text "\<And>"}.
 | 
|
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
850  | 
|
| 28778 | 851  | 
  \item @{syntax_ref (inner) pttrn} and @{syntax_ref (inner) pttrns}
 | 
852  | 
denote patterns for abstraction, cases bindings etc. In Pure, these  | 
|
853  | 
  categories start as a merely copy of @{syntax (inner) idt} and
 | 
|
854  | 
  @{syntax (inner) idts}, respectively.  Object-logics may add
 | 
|
855  | 
additional productions for binding forms.  | 
|
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
856  | 
|
| 28778 | 857  | 
  \item @{syntax_ref (inner) type} denotes types of the meta-logic.
 | 
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
858  | 
|
| 28778 | 859  | 
  \item @{syntax_ref (inner) sort} denotes meta-level sorts.
 | 
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
860  | 
|
| 
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
861  | 
  \end{description}
 | 
| 
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
862  | 
|
| 28774 | 863  | 
Here are some further explanations of certain syntax features.  | 
| 28773 | 864  | 
|
865  | 
  \begin{itemize}
 | 
|
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
866  | 
|
| 28778 | 867  | 
  \item In @{syntax (inner) idts}, note that @{text "x :: nat y"} is
 | 
868  | 
  parsed as @{text "x :: (nat y)"}, treating @{text y} like a type
 | 
|
869  | 
  constructor applied to @{text nat}.  To avoid this interpretation,
 | 
|
870  | 
  write @{text "(x :: nat) y"} with explicit parentheses.
 | 
|
| 28773 | 871  | 
|
872  | 
  \item Similarly, @{text "x :: nat y :: nat"} is parsed as @{text "x ::
 | 
|
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
873  | 
  (nat y :: nat)"}.  The correct form is @{text "(x :: nat) (y ::
 | 
| 
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
874  | 
  nat)"}, or @{text "(x :: nat) y :: nat"} if @{text y} is last in the
 | 
| 
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
875  | 
sequence of identifiers.  | 
| 28773 | 876  | 
|
877  | 
\item Type constraints for terms bind very weakly. For example,  | 
|
878  | 
  @{text "x < y :: nat"} is normally parsed as @{text "(x < y) ::
 | 
|
879  | 
  nat"}, unless @{text "<"} has a very low priority, in which case the
 | 
|
880  | 
  input is likely to be ambiguous.  The correct form is @{text "x < (y
 | 
|
881  | 
:: nat)"}.  | 
|
882  | 
||
883  | 
\item Constraints may be either written with two literal colons  | 
|
884  | 
  ``@{verbatim "::"}'' or the double-colon symbol @{verbatim "\<Colon>"},
 | 
|
| 28774 | 885  | 
  which actually looks exactly the same in some {\LaTeX} styles.
 | 
| 28773 | 886  | 
|
| 28774 | 887  | 
\item Dummy variables (written as underscore) may occur in different  | 
888  | 
roles.  | 
|
| 28773 | 889  | 
|
890  | 
  \begin{description}
 | 
|
891  | 
||
| 28774 | 892  | 
  \item A type ``@{text "_"}'' or ``@{text "_ :: sort"}'' acts like an
 | 
893  | 
anonymous inference parameter, which is filled-in according to the  | 
|
894  | 
most general type produced by the type-checking phase.  | 
|
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
895  | 
|
| 28774 | 896  | 
  \item A bound ``@{text "_"}'' refers to a vacuous abstraction, where
 | 
897  | 
the body does not refer to the binding introduced here. As in the  | 
|
898  | 
  term @{term "\<lambda>x _. x"}, which is @{text "\<alpha>"}-equivalent to @{text
 | 
|
899  | 
"\<lambda>x y. x"}.  | 
|
| 28773 | 900  | 
|
| 28774 | 901  | 
  \item A free ``@{text "_"}'' refers to an implicit outer binding.
 | 
902  | 
  Higher definitional packages usually allow forms like @{text "f x _
 | 
|
903  | 
= x"}.  | 
|
| 28773 | 904  | 
|
| 28774 | 905  | 
  \item A schematic ``@{text "_"}'' (within a term pattern, see
 | 
906  | 
  \secref{sec:term-decls}) refers to an anonymous variable that is
 | 
|
907  | 
implicitly abstracted over its context of locally bound variables.  | 
|
908  | 
  For example, this allows pattern matching of @{text "{x. f x = g
 | 
|
909  | 
  x}"} against @{text "{x. _ = _}"}, or even @{text "{_. _ = _}"} by
 | 
|
910  | 
using both bound and schematic dummies.  | 
|
| 28773 | 911  | 
|
912  | 
  \end{description}
 | 
|
913  | 
||
| 28774 | 914  | 
  \item The three literal dots ``@{verbatim "..."}'' may be also
 | 
915  | 
  written as ellipsis symbol @{verbatim "\<dots>"}.  In both cases this
 | 
|
916  | 
refers to a special schematic variable, which is bound in the  | 
|
917  | 
context. This special term abbreviation works nicely with  | 
|
918  | 
  calculational reasoning (\secref{sec:calculation}).
 | 
|
919  | 
||
| 46287 | 920  | 
  \item @{verbatim CONST} ensures that the given identifier is treated
 | 
921  | 
as constant term, and passed through the parse tree in fully  | 
|
922  | 
internalized form. This is particularly relevant for translation  | 
|
923  | 
  rules (\secref{sec:syn-trans}), notably on the RHS.
 | 
|
924  | 
||
925  | 
  \item @{verbatim XCONST} is similar to @{verbatim CONST}, but
 | 
|
926  | 
retains the constant name as given. This is only relevant to  | 
|
927  | 
  translation rules (\secref{sec:syn-trans}), notably on the LHS.
 | 
|
928  | 
||
| 28773 | 929  | 
  \end{itemize}
 | 
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
930  | 
*}  | 
| 
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
931  | 
|
| 28777 | 932  | 
|
| 46282 | 933  | 
subsection {* Inspecting the syntax *}
 | 
| 28777 | 934  | 
|
| 46282 | 935  | 
text {*
 | 
936  | 
  \begin{matharray}{rcl}
 | 
|
937  | 
    @{command_def "print_syntax"}@{text "\<^sup>*"} & : & @{text "context \<rightarrow>"} \\
 | 
|
938  | 
  \end{matharray}
 | 
|
| 28777 | 939  | 
|
| 46282 | 940  | 
  \begin{description}
 | 
941  | 
||
942  | 
  \item @{command "print_syntax"} prints the inner syntax of the
 | 
|
943  | 
current context. The output can be quite large; the most important  | 
|
944  | 
sections are explained below.  | 
|
| 28777 | 945  | 
|
| 46282 | 946  | 
  \begin{description}
 | 
| 28777 | 947  | 
|
| 46282 | 948  | 
  \item @{text "lexicon"} lists the delimiters of the inner token
 | 
949  | 
  language; see \secref{sec:inner-lex}.
 | 
|
| 28777 | 950  | 
|
| 46282 | 951  | 
  \item @{text "prods"} lists the productions of the underlying
 | 
952  | 
  priority grammar; see \secref{sec:priority-grammar}.
 | 
|
| 28777 | 953  | 
|
| 46282 | 954  | 
  The nonterminal @{text "A\<^sup>(\<^sup>p\<^sup>)"} is rendered in plain text as @{text
 | 
955  | 
"A[p]"}; delimiters are quoted. Many productions have an extra  | 
|
956  | 
  @{text "\<dots> => name"}.  These names later become the heads of parse
 | 
|
957  | 
trees; they also guide the pretty printer.  | 
|
| 28777 | 958  | 
|
| 46282 | 959  | 
  Productions without such parse tree names are called \emph{copy
 | 
960  | 
productions}. Their right-hand side must have exactly one  | 
|
961  | 
nonterminal symbol (or named token). The parser does not create a  | 
|
962  | 
new parse tree node for copy productions, but simply returns the  | 
|
963  | 
parse tree of the right-hand symbol.  | 
|
964  | 
||
965  | 
If the right-hand side of a copy production consists of a single  | 
|
966  | 
  nonterminal without any delimiters, then it is called a \emph{chain
 | 
|
967  | 
production}. Chain productions act as abbreviations: conceptually,  | 
|
968  | 
they are removed from the grammar by adding new productions.  | 
|
969  | 
Priority information attached to chain productions is ignored; only  | 
|
970  | 
  the dummy value @{text "-1"} is displayed.
 | 
|
971  | 
||
972  | 
  \item @{text "print modes"} lists the alternative print modes
 | 
|
973  | 
  provided by this grammar; see \secref{sec:print-modes}.
 | 
|
| 28777 | 974  | 
|
| 46282 | 975  | 
  \item @{text "parse_rules"} and @{text "print_rules"} relate to
 | 
976  | 
  syntax translations (macros); see \secref{sec:syn-trans}.
 | 
|
977  | 
||
978  | 
  \item @{text "parse_ast_translation"} and @{text
 | 
|
979  | 
"print_ast_translation"} list sets of constants that invoke  | 
|
980  | 
translation functions for abstract syntax trees, which are only  | 
|
981  | 
  required in very special situations; see \secref{sec:tr-funs}.
 | 
|
| 28777 | 982  | 
|
| 46282 | 983  | 
  \item @{text "parse_translation"} and @{text "print_translation"}
 | 
984  | 
list the sets of constants that invoke regular translation  | 
|
985  | 
  functions; see \secref{sec:tr-funs}.
 | 
|
| 29157 | 986  | 
|
| 46282 | 987  | 
  \end{description}
 | 
988  | 
||
989  | 
  \end{description}
 | 
|
| 28777 | 990  | 
*}  | 
| 28774 | 991  | 
|
| 
28770
 
93a372e2dc7a
added section "The Pure grammar" (incomplete version, based on old ref manual);
 
wenzelm 
parents: 
28769 
diff
changeset
 | 
992  | 
|
| 46291 | 993  | 
subsection {* Ambiguity of parsed expressions *}
 | 
994  | 
||
995  | 
text {*
 | 
|
996  | 
  \begin{tabular}{rcll}
 | 
|
| 
46512
 
4f9f61f9b535
simplified configuration options for syntax ambiguity;
 
wenzelm 
parents: 
46506 
diff
changeset
 | 
997  | 
    @{attribute_def syntax_ambiguity_warning} & : & @{text attribute} & default @{text true} \\
 | 
| 
46506
 
c7faa011bfa7
simplified configuration options for syntax ambiguity;
 
wenzelm 
parents: 
46494 
diff
changeset
 | 
998  | 
    @{attribute_def syntax_ambiguity_limit} & : & @{text attribute} & default @{text 10} \\
 | 
| 46291 | 999  | 
  \end{tabular}
 | 
1000  | 
||
1001  | 
Depending on the grammar and the given input, parsing may be  | 
|
1002  | 
ambiguous. Isabelle lets the Earley parser enumerate all possible  | 
|
1003  | 
parse trees, and then tries to make the best out of the situation.  | 
|
1004  | 
Terms that cannot be type-checked are filtered out, which often  | 
|
1005  | 
leads to a unique result in the end. Unlike regular type  | 
|
1006  | 
reconstruction, which is applied to the whole collection of input  | 
|
1007  | 
terms simultaneously, the filtering stage only treats each given  | 
|
1008  | 
term in isolation. Filtering is also not attempted for individual  | 
|
1009  | 
  types or raw ASTs (as required for @{command translations}).
 | 
|
1010  | 
||
1011  | 
Certain warning or error messages are printed, depending on the  | 
|
1012  | 
situation and the given configuration options. Parsing ultimately  | 
|
1013  | 
fails, if multiple results remain after the filtering phase.  | 
|
1014  | 
||
1015  | 
  \begin{description}
 | 
|
1016  | 
||
| 
46512
 
4f9f61f9b535
simplified configuration options for syntax ambiguity;
 
wenzelm 
parents: 
46506 
diff
changeset
 | 
1017  | 
  \item @{attribute syntax_ambiguity_warning} controls output of
 | 
| 
 
4f9f61f9b535
simplified configuration options for syntax ambiguity;
 
wenzelm 
parents: 
46506 
diff
changeset
 | 
1018  | 
explicit warning messages about syntax ambiguity.  | 
| 46291 | 1019  | 
|
| 
46506
 
c7faa011bfa7
simplified configuration options for syntax ambiguity;
 
wenzelm 
parents: 
46494 
diff
changeset
 | 
1020  | 
  \item @{attribute syntax_ambiguity_limit} determines the number of
 | 
| 46291 | 1021  | 
resulting parse trees that are shown as part of the printed message  | 
1022  | 
in case of an ambiguity.  | 
|
1023  | 
||
1024  | 
  \end{description}
 | 
|
1025  | 
*}  | 
|
1026  | 
||
1027  | 
||
| 48113 | 1028  | 
section {* Syntax transformations \label{sec:syntax-transformations} *}
 | 
1029  | 
||
1030  | 
text {* The inner syntax engine of Isabelle provides separate
 | 
|
| 52413 | 1031  | 
mechanisms to transform parse trees either via rewrite systems on  | 
| 48113 | 1032  | 
  first-order ASTs (\secref{sec:syn-trans}), or ML functions on ASTs
 | 
1033  | 
  or syntactic @{text "\<lambda>"}-terms (\secref{sec:tr-funs}).  This works
 | 
|
1034  | 
both for parsing and printing, as outlined in  | 
|
1035  | 
  \figref{fig:parse-print}.
 | 
|
1036  | 
||
1037  | 
  \begin{figure}[htbp]
 | 
|
1038  | 
  \begin{center}
 | 
|
1039  | 
  \begin{tabular}{cl}
 | 
|
1040  | 
string & \\  | 
|
1041  | 
  @{text "\<down>"}     & lexer + parser \\
 | 
|
1042  | 
parse tree & \\  | 
|
1043  | 
  @{text "\<down>"}     & parse AST translation \\
 | 
|
1044  | 
AST & \\  | 
|
1045  | 
  @{text "\<down>"}     & AST rewriting (macros) \\
 | 
|
1046  | 
AST & \\  | 
|
1047  | 
  @{text "\<down>"}     & parse translation \\
 | 
|
1048  | 
--- pre-term --- & \\  | 
|
1049  | 
  @{text "\<down>"}     & print translation \\
 | 
|
1050  | 
AST & \\  | 
|
1051  | 
  @{text "\<down>"}     & AST rewriting (macros) \\
 | 
|
1052  | 
AST & \\  | 
|
1053  | 
  @{text "\<down>"}     & print AST translation \\
 | 
|
1054  | 
string &  | 
|
1055  | 
  \end{tabular}
 | 
|
1056  | 
  \end{center}
 | 
|
1057  | 
  \caption{Parsing and printing with translations}\label{fig:parse-print}
 | 
|
1058  | 
  \end{figure}
 | 
|
1059  | 
||
1060  | 
These intermediate syntax tree formats eventually lead to a pre-term  | 
|
1061  | 
with all names and binding scopes resolved, but most type  | 
|
1062  | 
information still missing. Explicit type constraints might be given by  | 
|
1063  | 
the user, or implicit position information by the system --- both  | 
|
| 48816 | 1064  | 
need to be passed-through carefully by syntax transformations.  | 
| 48113 | 1065  | 
|
1066  | 
  Pre-terms are further processed by the so-called \emph{check} and
 | 
|
1067  | 
  \emph{unckeck} phases that are intertwined with type-inference (see
 | 
|
1068  | 
  also \cite{isabelle-implementation}).  The latter allows to operate
 | 
|
1069  | 
on higher-order abstract syntax with proper binding and type  | 
|
1070  | 
information already available.  | 
|
1071  | 
||
1072  | 
As a rule of thumb, anything that manipulates bindings of variables  | 
|
1073  | 
or constants needs to be implemented as syntax transformation (see  | 
|
1074  | 
below). Anything else is better done via check/uncheck: a prominent  | 
|
1075  | 
  example application is the @{command abbreviation} concept of
 | 
|
1076  | 
Isabelle/Pure. *}  | 
|
1077  | 
||
1078  | 
||
| 48115 | 1079  | 
subsection {* Abstract syntax trees \label{sec:ast} *}
 | 
| 48113 | 1080  | 
|
| 48114 | 1081  | 
text {* The ML datatype @{ML_type Ast.ast} explicitly represents the
 | 
1082  | 
intermediate AST format that is used for syntax rewriting  | 
|
1083  | 
  (\secref{sec:syn-trans}).  It is defined in ML as follows:
 | 
|
1084  | 
  \begin{ttbox}
 | 
|
1085  | 
datatype ast =  | 
|
1086  | 
Constant of string |  | 
|
1087  | 
Variable of string |  | 
|
1088  | 
Appl of ast list  | 
|
1089  | 
  \end{ttbox}
 | 
|
1090  | 
||
1091  | 
An AST is either an atom (constant or variable) or a list of (at  | 
|
1092  | 
least two) subtrees. Occasional diagnostic output of ASTs uses  | 
|
1093  | 
notation that resembles S-expression of LISP. Constant atoms are  | 
|
1094  | 
shown as quoted strings, variable atoms as non-quoted strings and  | 
|
1095  | 
applications as a parenthesized list of subtrees. For example, the  | 
|
1096  | 
AST  | 
|
1097  | 
  @{ML [display] "Ast.Appl
 | 
|
1098  | 
[Ast.Constant \"_abs\", Ast.Variable \"x\", Ast.Variable \"t\"]"}  | 
|
1099  | 
  is pretty-printed as @{verbatim "(\"_abs\" x t)"}.  Note that
 | 
|
1100  | 
  @{verbatim "()"} and @{verbatim "(x)"} are excluded as ASTs, because
 | 
|
1101  | 
they have too few subtrees.  | 
|
1102  | 
||
1103  | 
\medskip AST application is merely a pro-forma mechanism to indicate  | 
|
1104  | 
  certain syntactic structures.  Thus @{verbatim "(c a b)"} could mean
 | 
|
1105  | 
either term application or type application, depending on the  | 
|
1106  | 
syntactic context.  | 
|
1107  | 
||
1108  | 
  Nested application like @{verbatim "((\"_abs\" x t) u)"} is also
 | 
|
1109  | 
possible, but ASTs are definitely first-order: the syntax constant  | 
|
1110  | 
  @{verbatim "\"_abs\""} does not bind the @{verbatim x} in any way.
 | 
|
1111  | 
Proper bindings are introduced in later stages of the term syntax,  | 
|
1112  | 
  where @{verbatim "(\"_abs\" x t)"} becomes an @{ML Abs} node and
 | 
|
1113  | 
  occurrences of @{verbatim x} in @{verbatim t} are replaced by bound
 | 
|
1114  | 
variables (represented as de-Bruijn indices).  | 
|
| 48113 | 1115  | 
*}  | 
1116  | 
||
1117  | 
||
| 48115 | 1118  | 
subsubsection {* AST constants versus variables *}
 | 
| 48114 | 1119  | 
|
1120  | 
text {* Depending on the situation --- input syntax, output syntax,
 | 
|
1121  | 
  translation patterns --- the distinction of atomic asts as @{ML
 | 
|
1122  | 
  Ast.Constant} versus @{ML Ast.Variable} serves slightly different
 | 
|
1123  | 
purposes.  | 
|
1124  | 
||
1125  | 
  Input syntax of a term such as @{text "f a b = c"} does not yet
 | 
|
1126  | 
  indicate the scopes of atomic entities @{text "f, a, b, c"}: they
 | 
|
1127  | 
could be global constants or local variables, even bound ones  | 
|
1128  | 
  depending on the context of the term.  @{ML Ast.Variable} leaves
 | 
|
1129  | 
this choice still open: later syntax layers (or translation  | 
|
1130  | 
functions) may capture such a variable to determine its role  | 
|
1131  | 
specifically, to make it a constant, bound variable, free variable  | 
|
1132  | 
etc. In contrast, syntax translations that introduce already known  | 
|
1133  | 
  constants would rather do it via @{ML Ast.Constant} to prevent
 | 
|
1134  | 
accidental re-interpretation later on.  | 
|
1135  | 
||
1136  | 
  Output syntax turns term constants into @{ML Ast.Constant} and
 | 
|
1137  | 
  variables (free or schematic) into @{ML Ast.Variable}.  This
 | 
|
1138  | 
  information is precise when printing fully formal @{text "\<lambda>"}-terms.
 | 
|
1139  | 
||
| 52413 | 1140  | 
  \medskip AST translation patterns (\secref{sec:syn-trans}) that
 | 
1141  | 
represent terms cannot distinguish constants and variables  | 
|
1142  | 
  syntactically.  Explicit indication of @{text "CONST c"} inside the
 | 
|
1143  | 
  term language is required, unless @{text "c"} is known as special
 | 
|
1144  | 
  \emph{syntax constant} (see also @{command syntax}).  It is also
 | 
|
1145  | 
  possible to use @{command syntax} declarations (without mixfix
 | 
|
1146  | 
annotation) to enforce that certain unqualified names are always  | 
|
1147  | 
treated as constant within the syntax machinery.  | 
|
| 48114 | 1148  | 
|
| 52413 | 1149  | 
The situation is simpler for ASTs that represent types or sorts,  | 
1150  | 
since the concrete syntax already distinguishes type variables from  | 
|
1151  | 
  type constants (constructors).  So @{text "('a, 'b) foo"}
 | 
|
1152  | 
  corresponds to an AST application of some constant for @{text foo}
 | 
|
1153  | 
  and variable arguments for @{text "'a"} and @{text "'b"}.  Note that
 | 
|
1154  | 
the postfix application is merely a feature of the concrete syntax,  | 
|
1155  | 
while in the AST the constructor occurs in head position. *}  | 
|
| 48114 | 1156  | 
|
1157  | 
||
1158  | 
subsubsection {* Authentic syntax names *}
 | 
|
1159  | 
||
1160  | 
text {* Naming constant entities within ASTs is another delicate
 | 
|
| 52413 | 1161  | 
issue. Unqualified names are resolved in the name space tables in  | 
| 48114 | 1162  | 
the last stage of parsing, after all translations have been applied.  | 
1163  | 
Since syntax transformations do not know about this later name  | 
|
| 52413 | 1164  | 
resolution, there can be surprises in boundary cases.  | 
| 48114 | 1165  | 
|
1166  | 
  \emph{Authentic syntax names} for @{ML Ast.Constant} avoid this
 | 
|
1167  | 
problem: the fully-qualified constant name with a special prefix for  | 
|
1168  | 
  its formal category (@{text "class"}, @{text "type"}, @{text
 | 
|
1169  | 
  "const"}, @{text "fixed"}) represents the information faithfully
 | 
|
1170  | 
within the untyped AST format. Accidental overlap with free or  | 
|
1171  | 
bound variables is excluded as well. Authentic syntax names work  | 
|
1172  | 
implicitly in the following situations:  | 
|
1173  | 
||
1174  | 
  \begin{itemize}
 | 
|
1175  | 
||
1176  | 
\item Input of term constants (or fixed variables) that are  | 
|
1177  | 
  introduced by concrete syntax via @{command notation}: the
 | 
|
1178  | 
correspondence of a particular grammar production to some known term  | 
|
1179  | 
entity is preserved.  | 
|
1180  | 
||
| 48816 | 1181  | 
\item Input of type constants (constructors) and type classes ---  | 
| 48114 | 1182  | 
thanks to explicit syntactic distinction independently on the  | 
1183  | 
context.  | 
|
1184  | 
||
1185  | 
\item Output of term constants, type constants, type classes ---  | 
|
1186  | 
this information is already available from the internal term to be  | 
|
1187  | 
printed.  | 
|
1188  | 
||
1189  | 
  \end{itemize}
 | 
|
1190  | 
||
1191  | 
In other words, syntax transformations that operate on input terms  | 
|
| 48816 | 1192  | 
written as prefix applications are difficult to make robust.  | 
1193  | 
Luckily, this case rarely occurs in practice, because syntax forms  | 
|
| 52413 | 1194  | 
to be translated usually correspond to some concrete notation. *}  | 
| 48114 | 1195  | 
|
1196  | 
||
| 48113 | 1197  | 
subsection {* Raw syntax and translations \label{sec:syn-trans} *}
 | 
| 28762 | 1198  | 
|
1199  | 
text {*
 | 
|
| 48117 | 1200  | 
  \begin{tabular}{rcll}
 | 
| 
41229
 
d797baa3d57c
replaced command 'nonterminals' by slightly modernized version 'nonterminal';
 
wenzelm 
parents: 
40879 
diff
changeset
 | 
1201  | 
    @{command_def "nonterminal"} & : & @{text "theory \<rightarrow> theory"} \\
 | 
| 28762 | 1202  | 
    @{command_def "syntax"} & : & @{text "theory \<rightarrow> theory"} \\
 | 
1203  | 
    @{command_def "no_syntax"} & : & @{text "theory \<rightarrow> theory"} \\
 | 
|
1204  | 
    @{command_def "translations"} & : & @{text "theory \<rightarrow> theory"} \\
 | 
|
1205  | 
    @{command_def "no_translations"} & : & @{text "theory \<rightarrow> theory"} \\
 | 
|
| 48117 | 1206  | 
    @{attribute_def syntax_ast_trace} & : & @{text attribute} & default @{text false} \\
 | 
1207  | 
    @{attribute_def syntax_ast_stats} & : & @{text attribute} & default @{text false} \\
 | 
|
1208  | 
  \end{tabular}
 | 
|
| 28762 | 1209  | 
|
| 46292 | 1210  | 
Unlike mixfix notation for existing formal entities  | 
1211  | 
  (\secref{sec:notation}), raw syntax declarations provide full access
 | 
|
| 48115 | 1212  | 
to the priority grammar of the inner syntax, without any sanity  | 
1213  | 
checks. This includes additional syntactic categories (via  | 
|
1214  | 
  @{command nonterminal}) and free-form grammar productions (via
 | 
|
1215  | 
  @{command syntax}).  Additional syntax translations (or macros, via
 | 
|
1216  | 
  @{command translations}) are required to turn resulting parse trees
 | 
|
1217  | 
into proper representations of formal entities again.  | 
|
| 46292 | 1218  | 
|
| 
55112
 
b1a5d603fd12
prefer rail cartouche -- avoid back-slashed quotes;
 
wenzelm 
parents: 
55108 
diff
changeset
 | 
1219  | 
  @{rail \<open>
 | 
| 
42596
 
6c621a9d612a
modernized rail diagrams using @{rail} antiquotation;
 
wenzelm 
parents: 
42358 
diff
changeset
 | 
1220  | 
    @@{command nonterminal} (@{syntax name} + @'and')
 | 
| 28762 | 1221  | 
;  | 
| 
46494
 
ea2ae63336f3
clarified outer syntax "constdecl", which is only local to some rail diagrams;
 
wenzelm 
parents: 
46483 
diff
changeset
 | 
1222  | 
    (@@{command syntax} | @@{command no_syntax}) @{syntax mode}? (constdecl +)
 | 
| 28762 | 1223  | 
;  | 
| 
42596
 
6c621a9d612a
modernized rail diagrams using @{rail} antiquotation;
 
wenzelm 
parents: 
42358 
diff
changeset
 | 
1224  | 
    (@@{command translations} | @@{command no_translations})
 | 
| 
 
6c621a9d612a
modernized rail diagrams using @{rail} antiquotation;
 
wenzelm 
parents: 
42358 
diff
changeset
 | 
1225  | 
      (transpat ('==' | '=>' | '<=' | '\<rightleftharpoons>' | '\<rightharpoonup>' | '\<leftharpoondown>') transpat +)
 | 
| 28762 | 1226  | 
;  | 
1227  | 
||
| 
46494
 
ea2ae63336f3
clarified outer syntax "constdecl", which is only local to some rail diagrams;
 
wenzelm 
parents: 
46483 
diff
changeset
 | 
1228  | 
    constdecl: @{syntax name} '::' @{syntax type} @{syntax mixfix}?
 | 
| 
 
ea2ae63336f3
clarified outer syntax "constdecl", which is only local to some rail diagrams;
 
wenzelm 
parents: 
46483 
diff
changeset
 | 
1229  | 
;  | 
| 
42596
 
6c621a9d612a
modernized rail diagrams using @{rail} antiquotation;
 
wenzelm 
parents: 
42358 
diff
changeset
 | 
1230  | 
    mode: ('(' ( @{syntax name} | @'output' | @{syntax name} @'output' ) ')')
 | 
| 28762 | 1231  | 
;  | 
| 
42596
 
6c621a9d612a
modernized rail diagrams using @{rail} antiquotation;
 
wenzelm 
parents: 
42358 
diff
changeset
 | 
1232  | 
    transpat: ('(' @{syntax nameref} ')')? @{syntax string}
 | 
| 
55112
 
b1a5d603fd12
prefer rail cartouche -- avoid back-slashed quotes;
 
wenzelm 
parents: 
55108 
diff
changeset
 | 
1233  | 
\<close>}  | 
| 28762 | 1234  | 
|
1235  | 
  \begin{description}
 | 
|
| 46282 | 1236  | 
|
| 
41229
 
d797baa3d57c
replaced command 'nonterminals' by slightly modernized version 'nonterminal';
 
wenzelm 
parents: 
40879 
diff
changeset
 | 
1237  | 
  \item @{command "nonterminal"}~@{text c} declares a type
 | 
| 28762 | 1238  | 
  constructor @{text c} (without arguments) to act as purely syntactic
 | 
1239  | 
type: a nonterminal symbol of the inner syntax.  | 
|
1240  | 
||
| 46292 | 1241  | 
  \item @{command "syntax"}~@{text "(mode) c :: \<sigma> (mx)"} augments the
 | 
1242  | 
priority grammar and the pretty printer table for the given print  | 
|
1243  | 
  mode (default @{verbatim "\"\""}). An optional keyword @{keyword_ref
 | 
|
1244  | 
"output"} means that only the pretty printer table is affected.  | 
|
1245  | 
||
1246  | 
  Following \secref{sec:mixfix}, the mixfix annotation @{text "mx =
 | 
|
1247  | 
  template ps q"} together with type @{text "\<sigma> = \<tau>\<^sub>1 \<Rightarrow> \<dots> \<tau>\<^sub>n \<Rightarrow> \<tau>"} and
 | 
|
1248  | 
  specify a grammar production.  The @{text template} contains
 | 
|
1249  | 
  delimiter tokens that surround @{text "n"} argument positions
 | 
|
1250  | 
  (@{verbatim "_"}).  The latter correspond to nonterminal symbols
 | 
|
1251  | 
  @{text "A\<^sub>i"} derived from the argument types @{text "\<tau>\<^sub>i"} as
 | 
|
1252  | 
follows:  | 
|
1253  | 
  \begin{itemize}
 | 
|
1254  | 
||
1255  | 
  \item @{text "prop"} if @{text "\<tau>\<^sub>i = prop"}
 | 
|
1256  | 
||
1257  | 
  \item @{text "logic"} if @{text "\<tau>\<^sub>i = (\<dots>)\<kappa>"} for logical type
 | 
|
1258  | 
  constructor @{text "\<kappa> \<noteq> prop"}
 | 
|
1259  | 
||
1260  | 
  \item @{text any} if @{text "\<tau>\<^sub>i = \<alpha>"} for type variables
 | 
|
1261  | 
||
1262  | 
  \item @{text "\<kappa>"} if @{text "\<tau>\<^sub>i = \<kappa>"} for nonterminal @{text "\<kappa>"}
 | 
|
1263  | 
(syntactic type constructor)  | 
|
1264  | 
||
1265  | 
  \end{itemize}
 | 
|
1266  | 
||
1267  | 
  Each @{text "A\<^sub>i"} is decorated by priority @{text "p\<^sub>i"} from the
 | 
|
1268  | 
  given list @{text "ps"}; misssing priorities default to 0.
 | 
|
1269  | 
||
1270  | 
The resulting nonterminal of the production is determined similarly  | 
|
1271  | 
  from type @{text "\<tau>"}, with priority @{text "q"} and default 1000.
 | 
|
1272  | 
||
1273  | 
  \medskip Parsing via this production produces parse trees @{text
 | 
|
1274  | 
"t\<^sub>1, \<dots>, t\<^sub>n"} for the argument slots. The resulting parse tree is  | 
|
1275  | 
  composed as @{text "c t\<^sub>1 \<dots> t\<^sub>n"}, by using the syntax constant @{text
 | 
|
1276  | 
"c"} of the syntax declaration.  | 
|
1277  | 
||
1278  | 
Such syntactic constants are invented on the spot, without formal  | 
|
1279  | 
check wrt.\ existing declarations. It is conventional to use plain  | 
|
1280  | 
  identifiers prefixed by a single underscore (e.g.\ @{text
 | 
|
1281  | 
"_foobar"}). Names should be chosen with care, to avoid clashes  | 
|
| 48816 | 1282  | 
with other syntax declarations.  | 
| 46292 | 1283  | 
|
1284  | 
  \medskip The special case of copy production is specified by @{text
 | 
|
1285  | 
  "c = "}@{verbatim "\"\""} (empty string).  It means that the
 | 
|
1286  | 
  resulting parse tree @{text "t"} is copied directly, without any
 | 
|
1287  | 
further decoration.  | 
|
| 46282 | 1288  | 
|
| 28762 | 1289  | 
  \item @{command "no_syntax"}~@{text "(mode) decls"} removes grammar
 | 
1290  | 
  declarations (and translations) resulting from @{text decls}, which
 | 
|
1291  | 
  are interpreted in the same manner as for @{command "syntax"} above.
 | 
|
| 46282 | 1292  | 
|
| 28762 | 1293  | 
  \item @{command "translations"}~@{text rules} specifies syntactic
 | 
| 48115 | 1294  | 
translation rules (i.e.\ macros) as first-order rewrite rules on  | 
| 48816 | 1295  | 
  ASTs (\secref{sec:ast}).  The theory context maintains two
 | 
| 48115 | 1296  | 
  independent lists translation rules: parse rules (@{verbatim "=>"}
 | 
1297  | 
  or @{text "\<rightharpoonup>"}) and print rules (@{verbatim "<="} or @{text "\<leftharpoondown>"}).
 | 
|
1298  | 
For convenience, both can be specified simultaneously as parse~/  | 
|
1299  | 
  print rules (@{verbatim "=="} or @{text "\<rightleftharpoons>"}).
 | 
|
1300  | 
||
| 28762 | 1301  | 
Translation patterns may be prefixed by the syntactic category to be  | 
| 48115 | 1302  | 
  used for parsing; the default is @{text logic} which means that
 | 
1303  | 
regular term syntax is used. Both sides of the syntax translation  | 
|
1304  | 
rule undergo parsing and parse AST translations  | 
|
1305  | 
  \secref{sec:tr-funs}, in order to perform some fundamental
 | 
|
1306  | 
  normalization like @{text "\<lambda>x y. b \<leadsto> \<lambda>x. \<lambda>y. b"}, but other AST
 | 
|
1307  | 
  translation rules are \emph{not} applied recursively here.
 | 
|
1308  | 
||
1309  | 
When processing AST patterns, the inner syntax lexer runs in a  | 
|
1310  | 
different mode that allows identifiers to start with underscore.  | 
|
1311  | 
This accommodates the usual naming convention for auxiliary syntax  | 
|
1312  | 
constants --- those that do not have a logical counter part --- by  | 
|
1313  | 
allowing to specify arbitrary AST applications within the term  | 
|
1314  | 
syntax, independently of the corresponding concrete syntax.  | 
|
1315  | 
||
1316  | 
  Atomic ASTs are distinguished as @{ML Ast.Constant} versus @{ML
 | 
|
1317  | 
Ast.Variable} as follows: a qualified name or syntax constant  | 
|
1318  | 
  declared via @{command syntax}, or parse tree head of concrete
 | 
|
1319  | 
  notation becomes @{ML Ast.Constant}, anything else @{ML
 | 
|
1320  | 
  Ast.Variable}.  Note that @{text CONST} and @{text XCONST} within
 | 
|
1321  | 
  the term language (\secref{sec:pure-grammar}) allow to enforce
 | 
|
1322  | 
treatment as constants.  | 
|
1323  | 
||
1324  | 
  AST rewrite rules @{text "(lhs, rhs)"} need to obey the following
 | 
|
1325  | 
side-conditions:  | 
|
1326  | 
||
1327  | 
  \begin{itemize}
 | 
|
1328  | 
||
1329  | 
  \item Rules must be left linear: @{text "lhs"} must not contain
 | 
|
1330  | 
  repeated variables.\footnote{The deeper reason for this is that AST
 | 
|
1331  | 
equality is not well-defined: different occurrences of the ``same''  | 
|
1332  | 
AST could be decorated differently by accidental type-constraints or  | 
|
1333  | 
source position information, for example.}  | 
|
1334  | 
||
1335  | 
  \item Every variable in @{text "rhs"} must also occur in @{text
 | 
|
1336  | 
"lhs"}.  | 
|
1337  | 
||
1338  | 
  \end{itemize}
 | 
|
| 46282 | 1339  | 
|
| 28762 | 1340  | 
  \item @{command "no_translations"}~@{text rules} removes syntactic
 | 
1341  | 
translation rules, which are interpreted in the same manner as for  | 
|
1342  | 
  @{command "translations"} above.
 | 
|
1343  | 
||
| 48117 | 1344  | 
  \item @{attribute syntax_ast_trace} and @{attribute
 | 
1345  | 
syntax_ast_stats} control diagnostic output in the AST normalization  | 
|
1346  | 
process, when translation rules are applied to concrete input or  | 
|
1347  | 
output.  | 
|
1348  | 
||
| 28762 | 1349  | 
  \end{description}
 | 
| 46293 | 1350  | 
|
1351  | 
Raw syntax and translations provides a slightly more low-level  | 
|
1352  | 
access to the grammar and the form of resulting parse trees. It is  | 
|
1353  | 
often possible to avoid this untyped macro mechanism, and use  | 
|
1354  | 
  type-safe @{command abbreviation} or @{command notation} instead.
 | 
|
1355  | 
  Some important situations where @{command syntax} and @{command
 | 
|
1356  | 
translations} are really need are as follows:  | 
|
1357  | 
||
1358  | 
  \begin{itemize}
 | 
|
1359  | 
||
1360  | 
  \item Iterated replacement via recursive @{command translations}.
 | 
|
1361  | 
  For example, consider list enumeration @{term "[a, b, c, d]"} as
 | 
|
1362  | 
  defined in theory @{theory List} in Isabelle/HOL.
 | 
|
1363  | 
||
1364  | 
\item Change of binding status of variables: anything beyond the  | 
|
1365  | 
  built-in @{keyword "binder"} mixfix annotation requires explicit
 | 
|
1366  | 
syntax translations. For example, consider list filter  | 
|
1367  | 
  comprehension @{term "[x \<leftarrow> xs . P]"} as defined in theory @{theory
 | 
|
1368  | 
List} in Isabelle/HOL.  | 
|
1369  | 
||
1370  | 
  \end{itemize}
 | 
|
| 28762 | 1371  | 
*}  | 
1372  | 
||
| 48117 | 1373  | 
subsubsection {* Applying translation rules *}
 | 
1374  | 
||
1375  | 
text {* As a term is being parsed or printed, an AST is generated as
 | 
|
1376  | 
  an intermediate form according to \figref{fig:parse-print}.  The AST
 | 
|
1377  | 
is normalized by applying translation rules in the manner of a  | 
|
1378  | 
first-order term rewriting system. We first examine how a single  | 
|
1379  | 
rule is applied.  | 
|
1380  | 
||
1381  | 
  Let @{text "t"} be the abstract syntax tree to be normalized and
 | 
|
1382  | 
  @{text "(lhs, rhs)"} some translation rule.  A subtree @{text "u"}
 | 
|
1383  | 
  of @{text "t"} is called \emph{redex} if it is an instance of @{text
 | 
|
1384  | 
  "lhs"}; in this case the pattern @{text "lhs"} is said to match the
 | 
|
1385  | 
  object @{text "u"}.  A redex matched by @{text "lhs"} may be
 | 
|
1386  | 
  replaced by the corresponding instance of @{text "rhs"}, thus
 | 
|
1387  | 
  \emph{rewriting} the AST @{text "t"}.  Matching requires some notion
 | 
|
1388  | 
  of \emph{place-holders} in rule patterns: @{ML Ast.Variable} serves
 | 
|
1389  | 
this purpose.  | 
|
1390  | 
||
1391  | 
  More precisely, the matching of the object @{text "u"} against the
 | 
|
1392  | 
  pattern @{text "lhs"} is performed as follows:
 | 
|
1393  | 
||
1394  | 
  \begin{itemize}
 | 
|
1395  | 
||
1396  | 
  \item Objects of the form @{ML Ast.Variable}~@{text "x"} or @{ML
 | 
|
1397  | 
  Ast.Constant}~@{text "x"} are matched by pattern @{ML
 | 
|
1398  | 
  Ast.Constant}~@{text "x"}.  Thus all atomic ASTs in the object are
 | 
|
1399  | 
treated as (potential) constants, and a successful match makes them  | 
|
1400  | 
actual constants even before name space resolution (see also  | 
|
1401  | 
  \secref{sec:ast}).
 | 
|
1402  | 
||
1403  | 
  \item Object @{text "u"} is matched by pattern @{ML
 | 
|
1404  | 
  Ast.Variable}~@{text "x"}, binding @{text "x"} to @{text "u"}.
 | 
|
1405  | 
||
1406  | 
  \item Object @{ML Ast.Appl}~@{text "us"} is matched by @{ML
 | 
|
1407  | 
  Ast.Appl}~@{text "ts"} if @{text "us"} and @{text "ts"} have the
 | 
|
1408  | 
same length and each corresponding subtree matches.  | 
|
1409  | 
||
1410  | 
\item In every other case, matching fails.  | 
|
1411  | 
||
1412  | 
  \end{itemize}
 | 
|
1413  | 
||
1414  | 
  A successful match yields a substitution that is applied to @{text
 | 
|
1415  | 
  "rhs"}, generating the instance that replaces @{text "u"}.
 | 
|
1416  | 
||
1417  | 
Normalizing an AST involves repeatedly applying translation rules  | 
|
1418  | 
until none are applicable. This works yoyo-like: top-down,  | 
|
1419  | 
bottom-up, top-down, etc. At each subtree position, rules are  | 
|
1420  | 
chosen in order of appearance in the theory definitions.  | 
|
1421  | 
||
1422  | 
  The configuration options @{attribute syntax_ast_trace} and
 | 
|
| 48816 | 1423  | 
  @{attribute syntax_ast_stats} might help to understand this process
 | 
| 48117 | 1424  | 
and diagnose problems.  | 
1425  | 
||
1426  | 
  \begin{warn}
 | 
|
1427  | 
If syntax translation rules work incorrectly, the output of  | 
|
| 48118 | 1428  | 
  @{command_ref print_syntax} with its \emph{rules} sections reveals the
 | 
| 48117 | 1429  | 
actual internal forms of AST pattern, without potentially confusing  | 
1430  | 
concrete syntax. Recall that AST constants appear as quoted strings  | 
|
1431  | 
and variables without quotes.  | 
|
1432  | 
  \end{warn}
 | 
|
1433  | 
||
1434  | 
  \begin{warn}
 | 
|
1435  | 
  If @{attribute_ref eta_contract} is set to @{text "true"}, terms
 | 
|
1436  | 
  will be @{text "\<eta>"}-contracted \emph{before} the AST rewriter sees
 | 
|
1437  | 
them. Thus some abstraction nodes needed for print rules to match  | 
|
1438  | 
  may vanish.  For example, @{text "Ball A (\<lambda>x. P x)"} would contract
 | 
|
1439  | 
  to @{text "Ball A P"} and the standard print rule would fail to
 | 
|
1440  | 
apply. This problem can be avoided by hand-written ML translation  | 
|
1441  | 
  functions (see also \secref{sec:tr-funs}), which is in fact the same
 | 
|
1442  | 
  mechanism used in built-in @{keyword "binder"} declarations.
 | 
|
1443  | 
  \end{warn}
 | 
|
1444  | 
*}  | 
|
1445  | 
||
| 28762 | 1446  | 
|
| 48113 | 1447  | 
subsection {* Syntax translation functions \label{sec:tr-funs} *}
 | 
| 28762 | 1448  | 
|
1449  | 
text {*
 | 
|
1450  | 
  \begin{matharray}{rcl}
 | 
|
1451  | 
    @{command_def "parse_ast_translation"} & : & @{text "theory \<rightarrow> theory"} \\
 | 
|
1452  | 
    @{command_def "parse_translation"} & : & @{text "theory \<rightarrow> theory"} \\
 | 
|
1453  | 
    @{command_def "print_translation"} & : & @{text "theory \<rightarrow> theory"} \\
 | 
|
1454  | 
    @{command_def "typed_print_translation"} & : & @{text "theory \<rightarrow> theory"} \\
 | 
|
1455  | 
    @{command_def "print_ast_translation"} & : & @{text "theory \<rightarrow> theory"} \\
 | 
|
| 
48119
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1456  | 
    @{ML_antiquotation_def "class_syntax"} & : & @{text ML_antiquotation} \\
 | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1457  | 
    @{ML_antiquotation_def "type_syntax"} & : & @{text ML_antiquotation} \\
 | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1458  | 
    @{ML_antiquotation_def "const_syntax"} & : & @{text ML_antiquotation} \\
 | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1459  | 
    @{ML_antiquotation_def "syntax_const"} & : & @{text ML_antiquotation} \\
 | 
| 28762 | 1460  | 
  \end{matharray}
 | 
1461  | 
||
| 48118 | 1462  | 
Syntax translation functions written in ML admit almost arbitrary  | 
1463  | 
manipulations of inner syntax, at the expense of some complexity and  | 
|
1464  | 
obscurity in the implementation.  | 
|
1465  | 
||
| 
55112
 
b1a5d603fd12
prefer rail cartouche -- avoid back-slashed quotes;
 
wenzelm 
parents: 
55108 
diff
changeset
 | 
1466  | 
  @{rail \<open>
 | 
| 
42596
 
6c621a9d612a
modernized rail diagrams using @{rail} antiquotation;
 
wenzelm 
parents: 
42358 
diff
changeset
 | 
1467  | 
  ( @@{command parse_ast_translation} | @@{command parse_translation} |
 | 
| 
 
6c621a9d612a
modernized rail diagrams using @{rail} antiquotation;
 
wenzelm 
parents: 
42358 
diff
changeset
 | 
1468  | 
    @@{command print_translation} | @@{command typed_print_translation} |
 | 
| 52143 | 1469  | 
    @@{command print_ast_translation}) @{syntax text}
 | 
| 
48119
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1470  | 
;  | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1471  | 
  (@@{ML_antiquotation class_syntax} |
 | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1472  | 
   @@{ML_antiquotation type_syntax} |
 | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1473  | 
   @@{ML_antiquotation const_syntax} |
 | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1474  | 
   @@{ML_antiquotation syntax_const}) name
 | 
| 
55112
 
b1a5d603fd12
prefer rail cartouche -- avoid back-slashed quotes;
 
wenzelm 
parents: 
55108 
diff
changeset
 | 
1475  | 
\<close>}  | 
| 28762 | 1476  | 
|
| 
48119
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1477  | 
  \begin{description}
 | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1478  | 
|
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1479  | 
  \item @{command parse_translation} etc. declare syntax translation
 | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1480  | 
functions to the theory. Any of these commands have a single  | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1481  | 
  @{syntax text} argument that refers to an ML expression of
 | 
| 52413 | 1482  | 
appropriate type as follows:  | 
| 48118 | 1483  | 
|
1484  | 
\medskip  | 
|
| 
48119
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1485  | 
  {\footnotesize
 | 
| 52143 | 1486  | 
  \begin{tabular}{l}
 | 
1487  | 
  @{command parse_ast_translation} : \\
 | 
|
1488  | 
  \quad @{ML_type "(string * (Proof.context -> Ast.ast list -> Ast.ast)) list"} \\
 | 
|
1489  | 
  @{command parse_translation} : \\
 | 
|
1490  | 
  \quad @{ML_type "(string * (Proof.context -> term list -> term)) list"} \\
 | 
|
1491  | 
  @{command print_translation} : \\
 | 
|
1492  | 
  \quad @{ML_type "(string * (Proof.context -> term list -> term)) list"} \\
 | 
|
1493  | 
  @{command typed_print_translation} : \\
 | 
|
1494  | 
  \quad @{ML_type "(string * (Proof.context -> typ -> term list -> term)) list"} \\
 | 
|
1495  | 
  @{command print_ast_translation} : \\
 | 
|
1496  | 
  \quad @{ML_type "(string * (Proof.context -> Ast.ast list -> Ast.ast)) list"} \\
 | 
|
| 48118 | 1497  | 
  \end{tabular}}
 | 
1498  | 
\medskip  | 
|
| 28762 | 1499  | 
|
| 48816 | 1500  | 
  The argument list consists of @{text "(c, tr)"} pairs, where @{text
 | 
1501  | 
  "c"} is the syntax name of the formal entity involved, and @{text
 | 
|
1502  | 
  "tr"} a function that translates a syntax form @{text "c args"} into
 | 
|
| 52413 | 1503  | 
  @{text "tr ctxt args"} (depending on the context).  The Isabelle/ML
 | 
1504  | 
  naming convention for parse translations is @{text "c_tr"} and for
 | 
|
1505  | 
  print translations @{text "c_tr'"}.
 | 
|
| 48118 | 1506  | 
|
1507  | 
  The @{command_ref print_syntax} command displays the sets of names
 | 
|
1508  | 
  associated with the translation functions of a theory under @{text
 | 
|
1509  | 
"parse_ast_translation"} etc.  | 
|
1510  | 
||
| 
48119
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1511  | 
  \item @{text "@{class_syntax c}"}, @{text "@{type_syntax c}"},
 | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1512  | 
  @{text "@{const_syntax c}"} inline the authentic syntax name of the
 | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1513  | 
given formal entities into the ML source. This is the  | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1514  | 
fully-qualified logical name prefixed by a special marker to  | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1515  | 
indicate its kind: thus different logical name spaces are properly  | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1516  | 
distinguished within parse trees.  | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1517  | 
|
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1518  | 
  \item @{text "@{const_syntax c}"} inlines the name @{text "c"} of
 | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1519  | 
the given syntax constant, having checked that it has been declared  | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1520  | 
  via some @{command syntax} commands within the theory context.  Note
 | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1521  | 
that the usual naming convention makes syntax constants start with  | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1522  | 
underscore, to reduce the chance of accidental clashes with other  | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1523  | 
names occurring in parse trees (unqualified constants etc.).  | 
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1524  | 
|
| 
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1525  | 
  \end{description}
 | 
| 48118 | 1526  | 
*}  | 
1527  | 
||
| 
48119
 
55c305e29f4b
cover @{class_syntax}, @{type_syntax}, @{const_syntax}, @{syntax_const} in isar-ref, in contrast to other ML antiquotations in implementation manual;
 
wenzelm 
parents: 
48118 
diff
changeset
 | 
1528  | 
|
| 48118 | 1529  | 
subsubsection {* The translation strategy *}
 | 
| 28762 | 1530  | 
|
| 48816 | 1531  | 
text {* The different kinds of translation functions are invoked during
 | 
| 48118 | 1532  | 
the transformations between parse trees, ASTs and syntactic terms  | 
1533  | 
  (cf.\ \figref{fig:parse-print}).  Whenever a combination of the form
 | 
|
1534  | 
  @{text "c x\<^sub>1 \<dots> x\<^sub>n"} is encountered, and a translation function
 | 
|
1535  | 
  @{text "f"} of appropriate kind is declared for @{text "c"}, the
 | 
|
1536  | 
  result is produced by evaluation of @{text "f [x\<^sub>1, \<dots>, x\<^sub>n]"} in ML.
 | 
|
1537  | 
||
1538  | 
  For AST translations, the arguments @{text "x\<^sub>1, \<dots>, x\<^sub>n"} are ASTs.  A
 | 
|
1539  | 
  combination has the form @{ML "Ast.Constant"}~@{text "c"} or @{ML
 | 
|
1540  | 
  "Ast.Appl"}~@{text "["}@{ML Ast.Constant}~@{text "c, x\<^sub>1, \<dots>, x\<^sub>n]"}.
 | 
|
1541  | 
For term translations, the arguments are terms and a combination has  | 
|
1542  | 
  the form @{ML Const}~@{text "(c, \<tau>)"} or @{ML Const}~@{text "(c, \<tau>)
 | 
|
1543  | 
$ x\<^sub>1 $ \<dots> $ x\<^sub>n"}. Terms allow more sophisticated transformations  | 
|
1544  | 
than ASTs do, typically involving abstractions and bound  | 
|
1545  | 
  variables. \emph{Typed} print translations may even peek at the type
 | 
|
| 52413 | 1546  | 
  @{text "\<tau>"} of the constant they are invoked on, although some
 | 
1547  | 
information might have been suppressed for term output already.  | 
|
| 48118 | 1548  | 
|
1549  | 
Regardless of whether they act on ASTs or terms, translation  | 
|
1550  | 
functions called during the parsing process differ from those for  | 
|
1551  | 
printing in their overall behaviour:  | 
|
1552  | 
||
1553  | 
  \begin{description}
 | 
|
| 28762 | 1554  | 
|
| 48118 | 1555  | 
\item [Parse translations] are applied bottom-up. The arguments are  | 
1556  | 
already in translated form. The translations must not fail;  | 
|
1557  | 
exceptions trigger an error message. There may be at most one  | 
|
1558  | 
function associated with any syntactic name.  | 
|
| 46294 | 1559  | 
|
| 48118 | 1560  | 
\item [Print translations] are applied top-down. They are supplied  | 
1561  | 
with arguments that are partly still in internal form. The result  | 
|
1562  | 
again undergoes translation; therefore a print translation should  | 
|
1563  | 
not introduce as head the very constant that invoked it. The  | 
|
1564  | 
  function may raise exception @{ML Match} to indicate failure; in
 | 
|
1565  | 
this event it has no effect. Multiple functions associated with  | 
|
1566  | 
some syntactic name are tried in the order of declaration in the  | 
|
1567  | 
theory.  | 
|
1568  | 
||
1569  | 
  \end{description}
 | 
|
1570  | 
||
1571  | 
  Only constant atoms --- constructor @{ML Ast.Constant} for ASTs and
 | 
|
1572  | 
  @{ML Const} for terms --- can invoke translation functions.  This
 | 
|
1573  | 
means that parse translations can only be associated with parse tree  | 
|
1574  | 
heads of concrete syntax, or syntactic constants introduced via  | 
|
1575  | 
other translations. For plain identifiers within the term language,  | 
|
1576  | 
the status of constant versus variable is not yet know during  | 
|
1577  | 
parsing. This is in contrast to print translations, where constants  | 
|
1578  | 
are explicitly known from the given term in its fully internal form.  | 
|
| 28762 | 1579  | 
*}  | 
1580  | 
||
| 
52414
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1581  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1582  | 
subsection {* Built-in syntax transformations *}
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1583  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1584  | 
text {*
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1585  | 
Here are some further details of the main syntax transformation  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1586  | 
  phases of \figref{fig:parse-print}.
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1587  | 
*}  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1588  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1589  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1590  | 
subsubsection {* Transforming parse trees to ASTs *}
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1591  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1592  | 
text {* The parse tree is the raw output of the parser.  It is
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1593  | 
transformed into an AST according to some basic scheme that may be  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1594  | 
augmented by AST translation functions as explained in  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1595  | 
  \secref{sec:tr-funs}.
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1596  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1597  | 
The parse tree is constructed by nesting the right-hand sides of the  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1598  | 
productions used to recognize the input. Such parse trees are  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1599  | 
simply lists of tokens and constituent parse trees, the latter  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1600  | 
representing the nonterminals of the productions. Ignoring AST  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1601  | 
translation functions, parse trees are transformed to ASTs by  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1602  | 
stripping out delimiters and copy productions, while retaining some  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1603  | 
source position information from input tokens.  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1604  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1605  | 
The Pure syntax provides predefined AST translations to make the  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1606  | 
  basic @{text "\<lambda>"}-term structure more apparent within the
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1607  | 
(first-order) AST representation, and thus facilitate the use of  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1608  | 
  @{command translations} (see also \secref{sec:syn-trans}).  This
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1609  | 
covers ordinary term application, type application, nested  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1610  | 
abstraction, iterated meta implications and function types. The  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1611  | 
effect is illustrated on some representative input strings is as  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1612  | 
follows:  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1613  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1614  | 
  \begin{center}
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1615  | 
  \begin{tabular}{ll}
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1616  | 
input source & AST \\  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1617  | 
\hline  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1618  | 
  @{text "f x y z"} & @{verbatim "(f x y z)"} \\
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1619  | 
  @{text "'a ty"} & @{verbatim "(ty 'a)"} \\
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1620  | 
  @{text "('a, 'b)ty"} & @{verbatim "(ty 'a 'b)"} \\
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1621  | 
  @{text "\<lambda>x y z. t"} & @{verbatim "(\"_abs\" x (\"_abs\" y (\"_abs\" z t)))"} \\
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1622  | 
  @{text "\<lambda>x :: 'a. t"} & @{verbatim "(\"_abs\" (\"_constrain\" x 'a) t)"} \\
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1623  | 
  @{text "\<lbrakk>P; Q; R\<rbrakk> \<Longrightarrow> S"} & @{verbatim "(\"==>\" P (\"==>\" Q (\"==>\" R S)))"} \\
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1624  | 
   @{text "['a, 'b, 'c] \<Rightarrow> 'd"} & @{verbatim "(\"fun\" 'a (\"fun\" 'b (\"fun\" 'c 'd)))"} \\
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1625  | 
  \end{tabular}
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1626  | 
  \end{center}
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1627  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1628  | 
Note that type and sort constraints may occur in further places ---  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1629  | 
translations need to be ready to cope with them. The built-in  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1630  | 
syntax transformation from parse trees to ASTs insert additional  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1631  | 
constraints that represent source positions.  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1632  | 
*}  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1633  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1634  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1635  | 
subsubsection {* Transforming ASTs to terms *}
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1636  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1637  | 
text {* After application of macros (\secref{sec:syn-trans}), the AST
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1638  | 
is transformed into a term. This term still lacks proper type  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1639  | 
information, but it might contain some constraints consisting of  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1640  | 
  applications with head @{verbatim "_constrain"}, where the second
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1641  | 
argument is a type encoded as a pre-term within the syntax. Type  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1642  | 
inference later introduces correct types, or indicates type errors  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1643  | 
in the input.  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1644  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1645  | 
Ignoring parse translations, ASTs are transformed to terms by  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1646  | 
mapping AST constants to term constants, AST variables to term  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1647  | 
variables or constants (according to the name space), and AST  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1648  | 
applications to iterated term applications.  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1649  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1650  | 
The outcome is still a first-order term. Proper abstractions and  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1651  | 
bound variables are introduced by parse translations associated with  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1652  | 
  certain syntax constants.  Thus @{verbatim "(_abs x x)"} eventually
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1653  | 
  becomes a de-Bruijn term @{verbatim "Abs (\"x\", _, Bound 0)"}.
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1654  | 
*}  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1655  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1656  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1657  | 
subsubsection {* Printing of terms *}
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1658  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1659  | 
text {* The output phase is essentially the inverse of the input
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1660  | 
phase. Terms are translated via abstract syntax trees into  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1661  | 
pretty-printed text.  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1662  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1663  | 
Ignoring print translations, the transformation maps term constants,  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1664  | 
variables and applications to the corresponding constructs on ASTs.  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1665  | 
Abstractions are mapped to applications of the special constant  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1666  | 
  @{verbatim "_abs"} as seen before.  Type constraints are represented
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1667  | 
  via special @{verbatim "_constrain"} forms, according to various
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1668  | 
policies of type annotation determined elsewhere. Sort constraints  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1669  | 
of type variables are handled in a similar fashion.  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1670  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1671  | 
  After application of macros (\secref{sec:syn-trans}), the AST is
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1672  | 
finally pretty-printed. The built-in print AST translations reverse  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1673  | 
the corresponding parse AST translations.  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1674  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1675  | 
\medskip For the actual printing process, the priority grammar  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1676  | 
  (\secref{sec:priority-grammar}) plays a vital role: productions are
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1677  | 
used as templates for pretty printing, with argument slots stemming  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1678  | 
from nonterminals, and syntactic sugar stemming from literal tokens.  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1679  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1680  | 
  Each AST application with constant head @{text "c"} and arguments
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1681  | 
  @{text "t\<^sub>1"}, \dots, @{text "t\<^sub>n"} (for @{text "n = 0"} the AST is
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1682  | 
  just the constant @{text "c"} itself) is printed according to the
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1683  | 
  first grammar production of result name @{text "c"}.  The required
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1684  | 
syntax priority of the argument slot is given by its nonterminal  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1685  | 
  @{text "A\<^sup>(\<^sup>p\<^sup>)"}.  The argument @{text "t\<^sub>i"} that corresponds to the
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1686  | 
  position of @{text "A\<^sup>(\<^sup>p\<^sup>)"} is printed recursively, and then put in
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1687  | 
  parentheses \emph{if} its priority @{text "p"} requires this.  The
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1688  | 
resulting output is concatenated with the syntactic sugar according  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1689  | 
to the grammar production.  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1690  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1691  | 
  If an AST application @{text "(c x\<^sub>1 \<dots> x\<^sub>m)"} has more arguments than
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1692  | 
  the corresponding production, it is first split into @{text "((c x\<^sub>1
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1693  | 
\<dots> x\<^sub>n) x\<^sub>n\<^sub>+\<^sub>1 \<dots> x\<^sub>m)"} and then printed recursively as above.  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1694  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1695  | 
Applications with too few arguments or with non-constant head or  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1696  | 
without a corresponding production are printed in prefix-form like  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1697  | 
  @{text "f t\<^sub>1 \<dots> t\<^sub>n"} for terms.
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1698  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1699  | 
  Multiple productions associated with some name @{text "c"} are tried
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1700  | 
in order of appearance within the grammar. An occurrence of some  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1701  | 
  AST variable @{text "x"} is printed as @{text "x"} outright.
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1702  | 
|
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1703  | 
  \medskip White space is \emph{not} inserted automatically.  If
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1704  | 
blanks (or breaks) are required to separate tokens, they need to be  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1705  | 
  specified in the mixfix declaration (\secref{sec:mixfix}).
 | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1706  | 
*}  | 
| 
 
8429123bc58a
more on built-in syntax transformations, based on reduced version of old material;
 
wenzelm 
parents: 
52413 
diff
changeset
 | 
1707  | 
|
| 28762 | 1708  | 
end  |