author | wenzelm |
Fri, 23 Dec 2022 14:32:53 +0100 | |
changeset 76757 | 0d08ee0c1ea0 |
parent 76614 | ac08b6e3b9e3 |
permissions | -rw-r--r-- |
43283 | 1 |
/*  Title:      Pure/Isar/parse.scala
    Author:     Makarius

Generic parsers for Isabelle/Isar outer syntax.
*/
903092d61519
Generic parsers for Isabelle/Isar outer syntax -- Scala version.
wenzelm
parents:
diff
changeset
|
6 |
|
903092d61519
Generic parsers for Isabelle/Isar outer syntax -- Scala version.
wenzelm
parents:
diff
changeset
|
7 |
package isabelle |
903092d61519
Generic parsers for Isabelle/Isar outer syntax -- Scala version.
wenzelm
parents:
diff
changeset
|
8 |
|
55618 | 9 |
|
75405 | 10 |
import scala.util.parsing.combinator |
48599 | 11 |
import scala.annotation.tailrec |
34159
903092d61519
Generic parsers for Isabelle/Isar outer syntax -- Scala version.
wenzelm
parents:
diff
changeset
|
12 |
|
903092d61519
Generic parsers for Isabelle/Isar outer syntax -- Scala version.
wenzelm
parents:
diff
changeset
|
13 |
|
75393 | 14 |
object Parse {
  /* parsing tokens */

  // Parser combinators whose input elements are Isabelle tokens.
  trait Parsers extends combinator.Parsers {
    type Elem = Token

    // When true (the default), tokens whose is_proper is false are skipped
    // before each token is examined; override to make every token visible.
    def filter_proper: Boolean = true

    // Advance past leading tokens that are not is_proper (no-op when
    // filter_proper is false or the input is exhausted).
    @tailrec private def proper(in: Input): Input =
      if (!filter_proper || in.atEnd || in.first.is_proper) in
      else proper(in.rest)

    // Always succeeds without consuming a proper token: yields the position of
    // the next proper token, or of the end of input when nothing is left.
    private def proper_position: Parser[Position.T] =
      new Parser[Position.T] {
        def apply(raw_input: Input) = {
          val in = proper(raw_input)
          val pos =
            in.pos match {
              case pos: Token.Pos => pos
              // input with a different kind of position: fall back to "none"
              case _ => Token.Pos.none
            }
          Success(if (in.atEnd) pos.position() else pos.position(in.first), in)
        }
      }

    // Run `parser` and pair its result with the position determined by
    // proper_position immediately before it.
    def position[A](parser: Parser[A]): Parser[(A, Position.T)] =
      proper_position ~ parser ^^ { case x ~ y => (y, x) }

    // Accept a single token satisfying `pred`; `s` names what was expected and
    // is used as prefix of the failure message.
    def token(s: String, pred: Elem => Boolean): Parser[Elem] =
      new Parser[Elem] {
        def apply(raw_input: Input) = {
          val in = proper(raw_input)
          if (in.atEnd) Failure(s + " expected,\nbut end-of-input was found", in)
          else {
            val token = in.first
            // on success, also skip improper tokens that follow the match
            if (pred(token)) Success(token, proper(in.rest))
            else Failure(s + " expected,\nbut " + token.kind + " was found:\n" + token.source, in)
          }
        }
      }

    // Like `token`, but yields the content of the accepted token.
    def atom(s: String, pred: Elem => Boolean): Parser[String] =
      token(s, pred) ^^ (_.content)

    def command(name: String): Parser[String] = atom("command " + quote(name), _.is_command(name))
    def $$$(name: String): Parser[String] = atom("keyword " + quote(name), _.is_keyword(name))
    def string: Parser[String] = atom("string", _.is_string)

    // Integer.parseInt throws NumberFormatException for numerals that do not
    // fit into Int; turn that into None so that `nat` can fail gracefully.
    private def nat_value(s: String): Option[Int] =
      try { Some(Integer.parseInt(s)) }
      catch { case _: NumberFormatException => None }

    // Natural number token as Int; a numeral that cannot be represented as Int
    // is a parse failure instead of an exception escaping from the parser.
    def nat: Parser[Int] =
      atom("natural number", _.is_nat) ^? (
        Function.unlift((s: String) => nat_value(s)),
        s => "natural number expected,\nbut " + s + " is out of range")

    def name: Parser[String] = atom("name", _.is_name)

    // The following four parsers accept the same tokens (is_embedded) and
    // differ only in the description used for failure messages.
    def embedded: Parser[String] = atom("embedded content", _.is_embedded)
    def text: Parser[String] = atom("text", _.is_embedded)
    def ML_source: Parser[String] = atom("ML source", _.is_embedded)
    def document_source: Parser[String] = atom("document source", _.is_embedded)

    // Optional "(s)": true if present, false if absent.  Due to ~! there is no
    // backtracking to `false` once the opening parenthesis has been accepted.
    def opt_keyword(s: String): Parser[Boolean] =
      ($$$("(") ~! $$$(s) ~ $$$(")")) ^^ (_ => true) | success(false)

    // Embedded token whose content is accepted by Path.is_wellformed.
    def path: Parser[String] =
      atom("file name/path specification", tok => tok.is_embedded && Path.is_wellformed(tok.content))

    // Optional "in path", with `default` if the keyword is absent; ~! commits
    // to a path after "in".
    def in_path(default: String): Parser[String] =
      $$$("in") ~! path ^^ { case _ ~ x => x } | success(default)

    // Optional "(in path)", with `default` if the opening parenthesis is
    // absent; ~! commits to the full form after "(".
    def in_path_parens(default: String): Parser[String] =
      $$$("(") ~! ($$$("in") ~ path ~ $$$(")")) ^^ { case _ ~ (_ ~ x ~ _) => x } | success(default)

    // Same token class (is_system_name), different failure descriptions.
    def chapter_name: Parser[String] = atom("chapter name", _.is_system_name)
    def session_name: Parser[String] = atom("session name", _.is_system_name)
    def theory_name: Parser[String] = atom("theory name", _.is_system_name)

    private def tag_name: Parser[String] =
      atom("tag name", tok =>
          tok.kind == Token.Kind.IDENT ||
          tok.kind == Token.Kind.STRING)

    // "%" followed by a tag name; the result is the tag name only.
    def tag: Parser[String] = $$$("%") ~> tag_name
    def tags: Parser[List[String]] = rep(tag)

    // Content of a marker token (is_marker).
    def marker: Parser[String] = atom("marker", _.is_marker)

    // Any sequence of tags and markers, with results discarded.
    def annotation: Parser[Unit] = rep(tag | marker) ^^ (_ => ())


    /* wrappers */

    // Apply `p` to `in`; input remaining after the parse is not checked.
    def parse[T](p: Parser[T], in: Token.Reader): ParseResult[T] = p(in)

    // Like `parse`, but a successful result that leaves proper tokens
    // unconsumed is replaced by Error("bad input") at the first such token.
    def parse_all[T](p: Parser[T], in: Token.Reader): ParseResult[T] = {
      val result = parse(p, in)
      val rest = proper(result.next)
      if (result.successful && !rest.atEnd) Error("bad input", rest)
      else result
    }
  }
}