author | wenzelm |
Wed, 01 Nov 2017 20:46:23 +0100 | |
changeset 66983 | df83b66f1d94 |
parent 66776 | b74b9d0bf763 |
child 66984 | a1d3e5df0c95 |
permissions | -rw-r--r-- |
34166 | 1 |
/* Title: Pure/Isar/outer_syntax.scala |
2 |
Author: Makarius |
|
3 |
||
4 |
Isabelle/Isar outer syntax. |
|
5 |
*/ |
|
6 |
||
7 |
package isabelle |
|
8 |
||
9 |
||
43411
0206466ee473
some support for partial scans with explicit context;
wenzelm
parents:
40533
diff
changeset
|
10 |
import scala.collection.mutable |
34166 | 11 |
|
12 |
||
43774
6dfdb70496fe
added Outer_Syntax.quote_string, which is conceptually a bit different from Token.unparse;
wenzelm
parents:
43695
diff
changeset
|
13 |
object Outer_Syntax
{
  /* syntax */

  // shared default instance: every constructor argument takes its default value
  val empty: Outer_Syntax = new Outer_Syntax()

  // fresh syntax whose completion table is Completion.init()
  def init(): Outer_Syntax = new Outer_Syntax(completion = Completion.init())

  // left-to-right combination of all given syntaxes via ++, starting from empty
  def merge(syns: List[Outer_Syntax]): Outer_Syntax = syns.foldLeft(empty)(_ ++ _)


  /* string literals */

  // Render str as a double-quoted literal.  A symbol consisting of a single
  // character is written as backslash plus decimal code (zero-padded to three
  // digits) when it is a backslash, a double quote, or a character below 32
  // other than YXML.X / YXML.Y.  Everything else is copied unchanged.
  def quote_string(str: String): String =
  {
    def needs_escape(c: Char): Boolean =
      c == '\\' || c == '"' || (c < 32 && c != YXML.X && c != YXML.Y)

    val buf = new StringBuilder(str.length + 10)
    buf += '"'
    for (sym <- Symbol.iterator(str)) {
      if (sym.length != 1) buf ++= sym
      else {
        val ch = sym(0)
        if (needs_escape(ch)) {
          val code = ch.toInt.toString
          buf += '\\'
          // left-pad with zeros up to width 3; longer codes are left as they are
          buf ++= "0" * (3 - code.length)
          buf ++= code
        }
        else buf += ch
      }
    }
    buf += '"'
    buf.toString
  }
}
6dfdb70496fe
added Outer_Syntax.quote_string, which is conceptually a bit different from Token.unparse;
wenzelm
parents:
43695
diff
changeset
|
47 |
|
46712 | 48 |
final class Outer_Syntax private(
  val keywords: Keyword.Keywords = Keyword.Keywords.empty,
  val completion: Completion = Completion.empty,
  val rev_abbrevs: Thy_Header.Abbrevs = Nil,
  val language_context: Completion.Language_Context = Completion.Language_Context.outer,
  val has_tokens: Boolean = true)
{
  /** syntax content **/

  // printed form is that of the keyword table alone
  override def toString: String = keywords.toString


  /* keywords */

  // Add one keyword to the keyword table and to the completion table.
  // Completion additionally receives a "begin ... end" template when kind is
  // listed in Keyword.theory_block, and the name itself when it is a word
  // according to Completion.Word_Parsers.  The result always has tokens.
  def + (name: String, kind: String = "", exts: List[String] = Nil): Outer_Syntax =
  {
    val keywords1 = keywords + (name, kind, exts)

    val with_keyword = completion.add_keyword(name)
    // NOTE(review): \u0007 presumably marks the caret position inside the
    // template -- confirm against Completion
    val block_abbrevs =
      if (Keyword.theory_block.contains(kind)) List((name, name + "\nbegin\n\u0007\nend"))
      else Nil
    val word_abbrevs =
      if (Completion.Word_Parsers.is_word(name)) List((name, name)) else Nil
    val completion1 = with_keyword.add_abbrevs(block_abbrevs ::: word_abbrevs)

    new Outer_Syntax(keywords1, completion1, rev_abbrevs, language_context, has_tokens = true)
  }

  // Add every header keyword twice: under its decoded and its encoded symbol form.
  def add_keywords(keywords: Thy_Header.Keywords): Outer_Syntax =
    keywords.foldLeft(this) {
      case (syntax, (name, spec)) =>
        val with_decoded = syntax + (Symbol.decode(name), spec.kind, spec.exts)
        with_decoded + (Symbol.encode(name), spec.kind, spec.exts)
    }


  /* abbrevs */

  // abbreviations are stored reversed; this gives them back in forward order
  def abbrevs: Thy_Header.Abbrevs = rev_abbrevs.reverse

  // Register abbreviations: completion gets each one under the decoded and the
  // encoded form of its left-hand side (right-hand side always decoded), while
  // the distinct new entries are pushed in reverse order onto rev_abbrevs.
  def add_abbrevs(new_abbrevs: Thy_Header.Abbrevs): Outer_Syntax =
    if (new_abbrevs.nonEmpty) {
      val completion_abbrevs =
        new_abbrevs.flatMap {
          case (a, b) =>
            val a1 = Symbol.decode(a)
            val a2 = Symbol.encode(a)
            val b1 = Symbol.decode(b)
            List((a1, b1), (a2, b1))
        }
      val completion1 = completion.add_abbrevs(completion_abbrevs)
      val rev_abbrevs1 = rev_abbrevs.reverse_:::(Library.distinct(new_abbrevs))
      new Outer_Syntax(keywords, completion1, rev_abbrevs1, language_context, has_tokens)
    }
    else this


  /* build */

  // extend by the keywords of a node header, then by its abbreviations
  def + (header: Document.Node.Header): Outer_Syntax =
  {
    val with_keywords = add_keywords(header.keywords)
    with_keywords.add_abbrevs(header.abbrevs)
  }

  // Merge with another syntax.  Physical identity is preserved where possible:
  // this is returned when other is the same object or contributes nothing new,
  // and other is returned when this is the shared empty syntax.  Language
  // context and has_tokens of a merged result are taken from this.
  def ++ (other: Outer_Syntax): Outer_Syntax =
    if (this eq other) this
    else if (this eq Outer_Syntax.empty) other
    else {
      val keywords1 = keywords ++ other.keywords
      val completion1 = completion ++ other.completion
      val rev_abbrevs1 = Library.merge(rev_abbrevs, other.rev_abbrevs)

      val unchanged =
        (keywords eq keywords1) && (completion eq completion1) && (rev_abbrevs eq rev_abbrevs1)
      if (unchanged) this
      else new Outer_Syntax(keywords1, completion1, rev_abbrevs1, language_context, has_tokens)
    }


  /* load commands */

  // lookup in the load_commands table of the keywords
  def load_command(name: String): Option[List[String]] =
    keywords.load_commands.get(name)

  // delegated to the keywords
  def load_commands_in(text: String): Boolean =
    keywords.load_commands_in(text)


  /* language context */

  // copy of this syntax with the language context replaced
  def set_language_context(context: Completion.Language_Context): Outer_Syntax =
    new Outer_Syntax(keywords, completion, rev_abbrevs, context, has_tokens)

  // Variant with has_tokens = false; only admissible while the keyword table
  // is empty (the result falls back to the default keyword table).
  def no_tokens: Outer_Syntax =
  {
    require(keywords.is_empty)
    new Outer_Syntax(
      completion = completion,
      rev_abbrevs = rev_abbrevs,
      language_context = language_context,
      has_tokens = false)
  }



  /** parsing **/

  /* command spans */

  // Partition a token list into command spans.  Proper tokens accumulate in
  // `current`; improper tokens are parked in `trailing` until it is known
  // whether they belong inside the current span or form a span of their own.
  def parse_spans(toks: List[Token]): List[Command_Span.Span] =
  {
    val spans = new mutable.ListBuffer[Command_Span.Span]
    val current = new mutable.ListBuffer[Token]
    val trailing = new mutable.ListBuffer[Token]

    // classify one finished span and append it to the result
    def ship(span: List[Token]): Unit =
    {
      val kind =
        if (span.forall(_.is_improper)) Command_Span.Ignored_Span
        else if (span.exists(_.is_error)) Command_Span.Malformed_Span
        else
          span.find(_.is_command) match {
            case Some(cmd) =>
              val name = cmd.source
              // symbol offset of the command keyword within the span
              val offset =
                span.takeWhile(_ != cmd).foldLeft(0)((i, tok) => i + Symbol.length(tok.source))
              val range = Text.Range(offset, offset + Symbol.length(name))
              Command_Span.Command_Span(name, Position.Range(range + 1))
            case None => Command_Span.Malformed_Span
          }
      spans += Command_Span.Span(kind, span)
    }

    // emit whatever is pending: the proper content first, then parked improper tokens
    def flush(): Unit =
    {
      if (current.nonEmpty) { ship(current.toList); current.clear() }
      if (trailing.nonEmpty) { ship(trailing.toList); trailing.clear() }
    }

    for (tok <- toks) {
      if (tok.is_improper) trailing += tok
      else {
        // A new span starts at a "before command" token, or at a command token
        // unless the current span is still waiting for its command after such
        // a "before command" token.
        val starts_span =
          keywords.is_before_command(tok) ||
            (tok.is_command &&
              (!current.exists(keywords.is_before_command(_)) || current.exists(_.is_command)))

        if (starts_span) flush()
        else { current ++= trailing; trailing.clear() }
        current += tok
      }
    }
    flush()

    spans.toList
  }

  // tokenize the input with the current keywords, then split into spans
  def parse_spans(input: CharSequence): List[Command_Span.Span] =
  {
    val toks = Token.explode(keywords, input)
    parse_spans(toks)
  }
}