author | wenzelm |
Sun, 19 Jun 2011 14:11:06 +0200 | |
changeset 43455 | 4b4b93672f15 |
parent 43445 | 270bbbcda059 |
child 43695 | 5130dfe1b7be |
permissions | -rw-r--r-- |
34166 | 1 |
/*  Title:      Pure/Isar/outer_syntax.scala
    Author:     Makarius

Isabelle/Isar outer syntax.
*/
|
6 |
||
7 |
package isabelle |
|
8 |
||
9 |
||
10 |
import scala.util.parsing.input.{Reader, CharSequenceReader} |
|
43411
0206466ee473
some support for partial scans with explicit context;
wenzelm
parents:
40533
diff
changeset
|
11 |
import scala.collection.mutable |
34166 | 12 |
|
13 |
||
14 |
/**
 * Outer syntax tables: keyword kinds, scanner lexicon and completion
 * information, together with tokenization that is based on them.
 *
 * The `+` operations do not modify the receiver; each of them yields a
 * new Outer_Syntax instance with extended tables.
 */
class Outer_Syntax(symbols: Symbol.Interpretation)
{
  // keyword name -> keyword kind; initially only ";" (of kind Keyword.DIAG)
  protected val keywords: Map[String, String] = Map((";" -> Keyword.DIAG))

  // lexicon used by the scanners below; initially empty
  protected val lexicon: Scan.Lexicon = Scan.Lexicon.empty

  lazy val completion: Completion = new Completion + symbols // FIXME odd initialization


  /* keyword tables */

  /** Kind of the given keyword, or None if the name is not a known keyword. */
  def keyword_kind(name: String): Option[String] = keywords.get(name)

  /**
   * Extended syntax: `name` is registered with the given `kind`, added to
   * the lexicon, and entered into completion together with `replace`.
   */
  def + (name: String, kind: String, replace: String): Outer_Syntax =
  {
    // The extended tables are computed up-front, outside of the anonymous
    // subclass: inside its body the plain names would refer to the
    // overriding members themselves.
    val extended_completion = completion + (name, replace)
    val extended_lexicon = lexicon + name
    val extended_keywords = keywords + (name -> kind)

    new Outer_Syntax(symbols) {
      override val lexicon = extended_lexicon
      override val keywords = extended_keywords
      override lazy val completion = extended_completion
    }
  }

  /** Extended syntax, with the keyword name itself as completion replacement. */
  def + (name: String, kind: String): Outer_Syntax = this.+(name, kind, name)

  /** Extended syntax, with `name` registered as keyword of kind Keyword.MINOR. */
  def + (name: String): Outer_Syntax = this.+(name, Keyword.MINOR)

  /** True iff `name` is a known keyword whose kind differs from Keyword.MINOR. */
  def is_command(name: String): Boolean =
    keyword_kind(name).exists(kind => kind != Keyword.MINOR)


  /* heading levels */

  /**
   * Heading level of a command name: fixed levels 1 to 5 for the
   * hard-wired heading commands, level 6 for any other keyword whose kind
   * is accepted by Keyword.theory, and None for everything else.
   */
  def heading_level(name: String): Option[Int] =
    name match {
      // FIXME avoid hard-wired info!?
      case "header" => Some(1)
      case "chapter" => Some(2)
      case "section" | "sect" => Some(3)
      case "subsection" | "subsect" => Some(4)
      case "subsubsection" | "subsubsect" => Some(5)
      case _ => keyword_kind(name).filter(kind => Keyword.theory(kind)).map(_ => 6)
    }

  /** Heading level of a command, determined from its name. */
  def heading_level(command: Command): Option[Int] =
    heading_level(command.name)


  /* tokenize */

  /**
   * Tokenize the whole input.  Anything other than a successful parse of
   * the complete input is reported via error.
   */
  def scan(input: Reader[Char]): List[Token] =
  {
    import lexicon._

    val result = parseAll(rep(token(symbols, is_command)), input)
    result match {
      case Success(tokens, _) => tokens
      case _ => error("Unexpected failure of tokenizing input:\n" + input.source.toString)
    }
  }

  /** Tokenize the whole character sequence. */
  def scan(input: CharSequence): List[Token] =
    scan(new CharSequenceReader(input))

  /**
   * Tokenize the input one token at a time, starting from the given scanner
   * context and passing the context produced by each token on to the next.
   * The result consists of the tokens in input order and the final context.
   * A failure to parse a token is reported via error.
   */
  def scan_context(input: CharSequence, context: Scan.Context): (List[Token], Scan.Context) =
  {
    import lexicon._

    // Tokens are accumulated in reverse order and reversed once at the end.
    @scala.annotation.tailrec
    def loop(in: Reader[Char], rev_toks: List[Token], ctxt: Scan.Context)
        : (List[Token], Scan.Context) =
      if (in.atEnd) (rev_toks.reverse, ctxt)
      else
        parse(token_context(symbols, is_command, ctxt), in) match {
          case Success((tok, ctxt1), rest) => loop(rest, tok :: rev_toks, ctxt1)
          case NoSuccess(_, rest) =>
            error("Unexpected failure of tokenizing input:\n" + rest.source.toString)
        }

    loop(new CharSequenceReader(input), Nil, context)
  }
}