src/Pure/Isar/outer_syntax.scala
author wenzelm
Tue, 21 Oct 2014 15:21:44 +0200
changeset 58748 8f92f17d8781
parent 58747 c680f181b32e
child 58753 960bf499ca5d
permissions -rw-r--r--
support for structure matching; misc tuning;
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
34166
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     1
/*  Title:      Pure/Isar/outer_syntax.scala
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     2
    Author:     Makarius
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     3
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     4
Isabelle/Isar outer syntax.
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     5
*/
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     6
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     7
package isabelle
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     8
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     9
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
    10
import scala.util.parsing.input.{Reader, CharSequenceReader}
43411
0206466ee473 some support for partial scans with explicit context;
wenzelm
parents: 40533
diff changeset
    11
import scala.collection.mutable
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
    12
import scala.annotation.tailrec
34166
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
    13
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
    14
43774
6dfdb70496fe added Outer_Syntax.quote_string, which is conceptually a bit different from Token.unparse;
wenzelm
parents: 43695
diff changeset
    15
object Outer_Syntax
{
  /* syntax */

  // Syntax built from the constructor defaults only.
  val empty: Outer_Syntax = new Outer_Syntax()

  // Syntax whose completion is taken from Completion.init().
  def init(): Outer_Syntax = new Outer_Syntax(completion = Completion.init())


  /* string literals */

  // Wrap str in double quotes.  Single-character symbols that are control
  // characters (below 32, except YXML.X and YXML.Y), backslash or double quote
  // are written as a backslash followed by the decimal character code, padded
  // with zeros to three digits.  All other symbols are copied unchanged.
  def quote_string(str: String): String =
  {
    def needs_escape(c: Char): Boolean =
      (c < 32 && c != YXML.X && c != YXML.Y) || c == '\\' || c == '"'

    val buf = new StringBuilder(str.length + 10)
    buf += '"'
    Symbol.iterator(str).foreach(sym =>
      if (sym.length == 1 && needs_escape(sym(0))) {
        val digits = sym(0).toInt.toString
        buf += '\\'
        // left-pad to three digits ("0" * n is empty for n <= 0)
        buf ++= "0" * (3 - digits.length)
        buf ++= digits
      }
      else buf ++= sym)
    buf += '"'
    buf.toString
  }


  /* line-oriented structure */

  object Line_Structure
  {
    // Structure state built from the default field values.
    val init = Line_Structure()
  }

  // Per-line structure information; see Outer_Syntax.line_structure for how
  // the fields are computed from the tokens of a line.
  sealed case class Line_Structure(
    improper: Boolean = true,
    command: Boolean = false,
    depth: Int = 0,
    span_depth: Int = 0,
    after_span_depth: Int = 0)


  /* overall document structure */

  sealed abstract class Document { def length: Int }

  // Named block; its length is the sum of the lengths of its body elements.
  case class Document_Block(name: String, text: String, body: List[Document]) extends Document
  {
    val length: Int = body.foldLeft(0)((total, doc) => total + doc.length)
  }

  // Single command; its length is the length of that command.
  case class Document_Atom(command: Command) extends Document
  {
    def length: Int = command.length
  }
}
6dfdb70496fe added Outer_Syntax.quote_string, which is conceptually a bit different from Token.unparse;
wenzelm
parents: 43695
diff changeset
    75
46712
8650d9a95736 prefer final ADTs -- prevent ooddities;
wenzelm
parents: 46626
diff changeset
    76
final class Outer_Syntax private(
48864
3ee314ae1e0a added keyword kind "thy_load" (with optional list of file extensions);
wenzelm
parents: 48708
diff changeset
    77
  keywords: Map[String, (String, List[String])] = Map.empty,
46626
a02115865bcc streamlined abstract datatype;
wenzelm
parents: 46624
diff changeset
    78
  lexicon: Scan.Lexicon = Scan.Lexicon.empty,
53280
c63a016805b9 explicit indication of outer syntax with no tokens;
wenzelm
parents: 52439
diff changeset
    79
  val completion: Completion = Completion.empty,
55749
75a48dc4383e tuned signature;
wenzelm
parents: 55666
diff changeset
    80
  val language_context: Completion.Language_Context = Completion.Language_Context.outer,
56393
22f533e6a049 more abstract Prover.Syntax, as proposed by Carst Tankink;
wenzelm
parents: 56314
diff changeset
    81
  val has_tokens: Boolean = true) extends Prover.Syntax
34166
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
    82
{
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
    83
  /** syntax content **/
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
    84
48660
730ca503e955 static outer syntax based on session specifications;
wenzelm
parents: 47469
diff changeset
    85
  // Render all keywords as a sorted "keywords ... and ..." declaration:
  // minor keywords as the quoted name only, all others as
  // name :: kind, followed by the quoted file list when it is non-empty.
  override def toString: String =
  {
    val entries =
      keywords.iterator.map({ case (name, (kind, files)) =>
        if (kind == Keyword.MINOR) quote(name)
        else {
          val files_suffix =
            files match {
              case Nil => ""
              case _ => " (" + commas_quote(files) + ")"
            }
          quote(name) + " :: " + quote(kind) + files_suffix
        }
      }).toList
    entries.sorted.mkString("keywords\n  ", " and\n  ", "")
  }
48660
730ca503e955 static outer syntax based on session specifications;
wenzelm
parents: 47469
diff changeset
    92
58695
91839729224e tuned comments;
wenzelm
parents: 58694
diff changeset
    93
91839729224e tuned comments;
wenzelm
parents: 58694
diff changeset
    94
  /* keyword kind */
91839729224e tuned comments;
wenzelm
parents: 58694
diff changeset
    95
48864
3ee314ae1e0a added keyword kind "thy_load" (with optional list of file extensions);
wenzelm
parents: 48708
diff changeset
    96
  // Look up the (kind, files) entry declared for the keyword name, if any.
  def keyword_kind_files(name: String): Option[(String, List[String])] =
    keywords get name
3ee314ae1e0a added keyword kind "thy_load" (with optional list of file extensions);
wenzelm
parents: 48708
diff changeset
    97
  // Kind component of the keyword entry for name, if the keyword is declared.
  def keyword_kind(name: String): Option[String] =
    keyword_kind_files(name).map({ case (kind, _) => kind })
38471
0924654b8163 report command token name instead of kind, which can be retrieved later via Outer_Syntax.keyword_kind;
wenzelm
parents: 36956
diff changeset
    98
58695
91839729224e tuned comments;
wenzelm
parents: 58694
diff changeset
    99
  // A name is a command iff it is a declared keyword whose kind is not
  // Keyword.MINOR.
  def is_command(name: String): Boolean =
    keyword_kind(name).exists(kind => kind != Keyword.MINOR)
91839729224e tuned comments;
wenzelm
parents: 58694
diff changeset
   104
58696
6b7445774ce3 more explicit Line_Nesting;
wenzelm
parents: 58695
diff changeset
   105
  // Test whether token is a command token whose source is a declared
  // non-minor keyword with a kind accepted by pred.
  //
  // The keyword table is consulted once; pred is only applied to the kind of
  // an actual command (never to Keyword.MINOR), and no Option.get is needed.
  def command_kind(token: Token, pred: String => Boolean): Boolean =
    token.is_command &&
      keyword_kind(token.source).exists(kind => kind != Keyword.MINOR && pred(kind))
6b7445774ce3 more explicit Line_Nesting;
wenzelm
parents: 58695
diff changeset
   108
58695
91839729224e tuned comments;
wenzelm
parents: 58694
diff changeset
   109
91839729224e tuned comments;
wenzelm
parents: 58694
diff changeset
   110
  /* load commands */
91839729224e tuned comments;
wenzelm
parents: 58694
diff changeset
   111
57901
e1abca2527da more explicit type Span in Scala, according to ML version;
wenzelm
parents: 56393
diff changeset
   112
  // File extensions declared for name when its keyword kind is
  // Keyword.THY_LOAD; None for any other kind or an undeclared name.
  def load_command(name: String): Option[List[String]] =
    keywords.get(name).collect({ case (Keyword.THY_LOAD, exts) => exts })
c9bb76303348 explicit indication of thy_load commands;
wenzelm
parents: 53280
diff changeset
   117
56314
9a513737a0b2 tuned signature;
wenzelm
parents: 55749
diff changeset
   118
  // All keywords of kind Keyword.THY_LOAD, paired with their file lists.
  val load_commands: List[(String, List[String])] =
    keywords.iterator.collect({
      case (name, (Keyword.THY_LOAD, files)) => (name, files)
    }).toList
48872
6124e0d1120a some support for thy_load_commands;
wenzelm
parents: 48870
diff changeset
   120
56393
22f533e6a049 more abstract Prover.Syntax, as proposed by Carst Tankink;
wenzelm
parents: 56314
diff changeset
   121
  // True if the name of some load command occurs in text as a plain
  // substring (no tokenization is performed here).
  def load_commands_in(text: String): Boolean =
    load_commands.exists(entry => text.containsSlice(entry._1))
22f533e6a049 more abstract Prover.Syntax, as proposed by Carst Tankink;
wenzelm
parents: 56314
diff changeset
   123
58695
91839729224e tuned comments;
wenzelm
parents: 58694
diff changeset
   124
91839729224e tuned comments;
wenzelm
parents: 58694
diff changeset
   125
  /* add keywords */
91839729224e tuned comments;
wenzelm
parents: 58694
diff changeset
   126
50128
599c935aac82 alternative completion for outer syntax keywords;
wenzelm
parents: 48885
diff changeset
   127
  // Extend the syntax by keyword name with the given (kind, files) entry.
  // The name is added to the keyword table and the lexicon.  A completion
  // entry (name, replacement defaulting to name) is added unless
  // Keyword.control accepts the kind or the replacement is Some("").
  // The result always has has_tokens = true.
  def + (name: String, kind: (String, List[String]), replace: Option[String]): Outer_Syntax =
  {
    val (kind_name, _) = kind
    val extended_keywords = keywords + (name -> kind)
    val extended_lexicon = lexicon + name
    val skip_completion = Keyword.control(kind_name) || replace == Some("")
    val extended_completion =
      if (skip_completion) completion
      else completion + (name, replace getOrElse name)
    new Outer_Syntax(
      extended_keywords,
      extended_lexicon,
      extended_completion,
      language_context,
      has_tokens = true)
  }
34166
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
   136
53280
c63a016805b9 explicit indication of outer syntax with no tokens;
wenzelm
parents: 52439
diff changeset
   137
  // Convenience variants; all delegate to the three-argument version.

  // keyword with (kind, files), completed by its own name
  def + (name: String, kind: (String, List[String])): Outer_Syntax =
    this.+(name, kind, Some(name))

  // keyword with plain kind and no files, completed by its own name
  def + (name: String, kind: String): Outer_Syntax =
    this.+(name, (kind, Nil), Some(name))

  // minor keyword with explicit completion replacement
  def + (name: String, replace: Option[String]): Outer_Syntax =
    this.+(name, (Keyword.MINOR, Nil), replace)

  // minor keyword without explicit completion replacement
  def + (name: String): Outer_Syntax =
    this.+(name, None)
48706
e2b512024eab tuned signature;
wenzelm
parents: 48671
diff changeset
   144
48873
18b17f15bc62 more direct cumulation of (sparse) keywords;
wenzelm
parents: 48872
diff changeset
   145
  // Add all keyword declarations to this syntax, from left to right.
  // Each name is registered twice: first in its Symbol.decode form, then in
  // its Symbol.encode form.  Declarations that carry a kind add a keyword of
  // that kind; declarations without a kind use the (name, replace) variant
  // of "+".
  def add_keywords(keywords: Thy_Header.Keywords): Outer_Syntax =
    keywords.foldLeft(this) {
      case (syntax, (name, Some((kind, _)), replace)) =>
        val with_decoded = syntax + (Symbol.decode(name), kind, replace)
        with_decoded + (Symbol.encode(name), kind, replace)
      case (syntax, (name, None, replace)) =>
        val with_decoded = syntax + (Symbol.decode(name), replace)
        with_decoded + (Symbol.encode(name), replace)
    }
34166
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
   156
58695
91839729224e tuned comments;
wenzelm
parents: 58694
diff changeset
   157
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   158
  /* language context */
34166
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
   159
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   160
  // Copy of this syntax in which only the language context is replaced.
  def set_language_context(context: Completion.Language_Context): Outer_Syntax =
    new Outer_Syntax(
      keywords = keywords,
      lexicon = lexicon,
      completion = completion,
      language_context = context,
      has_tokens = has_tokens)
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   162
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   163
  // Variant of this syntax marked as having no tokens.  Only permitted while
  // no keywords have been added (both the keyword table and the lexicon must
  // be empty); completion and language context are carried over, everything
  // else takes the constructor defaults.
  def no_tokens: Outer_Syntax =
  {
    require(keywords.isEmpty)
    require(lexicon.isEmpty)
    new Outer_Syntax(
      completion = completion, language_context = language_context, has_tokens = false)
  }
40454
2516ea25a54b some support for nested source structure, based on section headings;
wenzelm
parents: 38471
diff changeset
   171
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   172
40454
2516ea25a54b some support for nested source structure, based on section headings;
wenzelm
parents: 38471
diff changeset
   173
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   174
  /** parsing **/
34166
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
   175
58697
5bc1d6c4a499 tuned signature;
wenzelm
parents: 58696
diff changeset
   176
  /* line-oriented structure */
58696
6b7445774ce3 more explicit Line_Nesting;
wenzelm
parents: 58695
diff changeset
   177
58700
4717d18cc619 clarified Line_Structure wrt. command span;
wenzelm
parents: 58697
diff changeset
   178
  // Compute the structure of one line from its tokens and the structure
  // state struct that is passed in (NOTE(review): presumably the state of the
  // preceding line -- confirm against the caller).
  //
  //   improper: all tokens of the line are improper
  //   command:  the line contains some command token
  //   depth:    0 if the line contains a command of kind Keyword.theory,
  //             otherwise the incoming after_span_depth if it contains any
  //             command, otherwise the incoming span_depth
  //   span_depth, after_span_depth: the incoming pair, updated token by token
  //             according to the kind of each command token
  def line_structure(tokens: List[Token], struct: Outer_Syntax.Line_Structure)
    : Outer_Syntax.Line_Structure =
  {
    val only_improper = tokens.forall(_.is_improper)
    val has_command = tokens.exists(_.is_command)
    val has_theory_command = tokens.exists(command_kind(_, Keyword.theory))

    val line_depth =
      if (has_theory_command) 0
      else if (has_command) struct.after_span_depth
      else struct.span_depth

    val (next_span_depth, next_after_span_depth) =
      tokens.foldLeft((struct.span_depth, struct.after_span_depth)) {
        case (depths @ (_, after), tok) =>
          // the order of these checks is significant: first match wins
          if (!tok.is_command) depths
          else if (command_kind(tok, Keyword.theory_goal)) (2, 1)
          else if (command_kind(tok, Keyword.theory)) (1, 0)
          else if (command_kind(tok, Keyword.proof_goal) || tok.source == "{")
            (after + 2, after + 1)
          else if (command_kind(tok, Keyword.qed) || tok.source == "}")
            (after + 1, after - 1)
          else if (command_kind(tok, Keyword.qed_global)) (1, 0)
          else depths
      }

    Outer_Syntax.Line_Structure(
      improper = only_improper,
      command = has_command,
      depth = line_depth,
      span_depth = next_span_depth,
      after_span_depth = next_after_span_depth)
  }
6b7445774ce3 more explicit Line_Nesting;
wenzelm
parents: 58695
diff changeset
   205
6b7445774ce3 more explicit Line_Nesting;
wenzelm
parents: 58695
diff changeset
   206
53280
c63a016805b9 explicit indication of outer syntax with no tokens;
wenzelm
parents: 52439
diff changeset
   207
  /* token language */
c63a016805b9 explicit indication of outer syntax with no tokens;
wenzelm
parents: 52439
diff changeset
   208
57907
7fc36b4c7cce tuned signature;
wenzelm
parents: 57906
diff changeset
   209
  // Tokenize the complete input with the lexicon and command predicate of
  // this syntax.  Anything other than a successful parse of the whole input
  // is reported via error, quoting the input.
  def scan(input: CharSequence): List[Token] =
  {
    val reader: Reader[Char] = new CharSequenceReader(input)
    val all_tokens = Token.Parsers.rep(Token.Parsers.token(lexicon, is_command))
    Token.Parsers.parseAll(all_tokens, reader) match {
      case Token.Parsers.Success(tokens, _) => tokens
      case _ => error("Unexpected failure of tokenizing input:\n" + input.toString)
    }
  }
34166
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
   218
58748
8f92f17d8781 support for structure matching;
wenzelm
parents: 58747
diff changeset
   219
  // Tokenize one line of input, starting from the given line context.
  // Tokens are parsed one at a time; each successful step yields a token and
  // the context for the next step.  Returns the tokens in input order
  // together with the context reached at the end of the input.  A failing
  // step is reported via error, quoting the source of the remaining input.
  def scan_line(input: CharSequence, context: Scan.Line_Context)
    : (List[Token], Scan.Line_Context) =
  {
    @tailrec def loop(in: Reader[Char], ctxt: Scan.Line_Context, rev_toks: List[Token])
      : (List[Token], Scan.Line_Context) =
    {
      if (in.atEnd) (rev_toks.reverse, ctxt)
      else {
        Token.Parsers.parse(Token.Parsers.token_line(lexicon, is_command, ctxt), in) match {
          case Token.Parsers.Success((tok, next_ctxt), rest) =>
            loop(rest, next_ctxt, tok :: rev_toks)
          case Token.Parsers.NoSuccess(_, rest) =>
            error("Unexpected failure of tokenizing input:\n" + rest.source.toString)
        }
      }
    }
    loop(new CharSequenceReader(input), context, Nil)
  }
55616
25a7a998852a default completion context via outer syntax;
wenzelm
parents: 55510
diff changeset
   233
25a7a998852a default completion context via outer syntax;
wenzelm
parents: 55510
diff changeset
   234
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   235
  /* command spans */
57905
c0c5652e796e separate module Command_Span: mostly syntactic representation;
wenzelm
parents: 57901
diff changeset
   236
c0c5652e796e separate module Command_Span: mostly syntactic representation;
wenzelm
parents: 57901
diff changeset
   237
  /* Partition a token list into command spans.

     A command token always starts a new span.  Improper tokens are held back:
     they are absorbed into the current span once a further proper token
     follows, otherwise they are shipped as a separate span of their own
     (when the next command starts, or at the end of input).

     Span kinds:
       - Command_Span: non-empty, first token is a command, no error token;
       - Ignored_Span: consists of improper tokens only;
       - Malformed_Span: anything else.
  */
  def parse_spans(toks: List[Token]): List[Command_Span.Span] =
  {
    val spans = new mutable.ListBuffer[Command_Span.Span]
    val current = new mutable.ListBuffer[Token]
    val held_back = new mutable.ListBuffer[Token]

    // classify one finished span and append it to the result
    def ship(span: List[Token])
    {
      val kind =
        span match {
          case first :: _ if first.is_command && !span.exists(_.is_error) =>
            val name = first.source
            // range over the command name, measured in symbols
            val name_length = Symbol.iterator(name).length
            Command_Span.Command_Span(name, Position.Range(Text.Range(0, name_length) + 1))
          case _ if span.forall(_.is_improper) => Command_Span.Ignored_Span
          case _ => Command_Span.Malformed_Span
        }
      spans += Command_Span.Span(kind, span)
    }

    // ship the buffered tokens (if any) as one span and reset the buffer
    def drain(buf: mutable.ListBuffer[Token])
    {
      if (buf.nonEmpty) {
        ship(buf.toList)
        buf.clear()
      }
    }

    // pending content first, then held-back improper tokens as separate span
    def flush()
    {
      drain(current)
      drain(held_back)
    }

    toks.foreach(tok =>
      if (tok.is_command) {
        flush()
        current += tok
      }
      else if (tok.is_improper) held_back += tok
      else {
        // proper non-command token: held-back tokens belong to the same span
        current ++= held_back
        held_back.clear()
        current += tok
      })
    flush()

    spans.toList
  }
c0c5652e796e separate module Command_Span: mostly syntactic representation;
wenzelm
parents: 57901
diff changeset
   271
57906
020df63dd0a9 tuned signature;
wenzelm
parents: 57905
diff changeset
   272
  /* Command spans of raw text: tokenize via scan, then group the tokens. */
  def parse_spans(input: CharSequence): List[Command_Span.Span] =
  {
    val toks = scan(input)
    parse_spans(toks)
  }
020df63dd0a9 tuned signature;
wenzelm
parents: 57905
diff changeset
   274
57905
c0c5652e796e separate module Command_Span: mostly syntactic representation;
wenzelm
parents: 57901
diff changeset
   275
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   276
  /* overall document structure */
55616
25a7a998852a default completion context via outer syntax;
wenzelm
parents: 55510
diff changeset
   277
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   278
  /* Nesting level of a command within the document structure:
       0      for the command named "header" (regardless of its keyword kind),
       1      for THY_HEADING1,
       2 - 4  for THY_HEADING2..4 and PRF_HEADING2..4,
       5      for any other kind accepted by Keyword.theory,
       None   for everything else (including unknown keywords).
  */
  def heading_level(command: Command): Option[Int] =
  {
    val name = command.name
    val kind = keyword_kind(name)

    if (name == "header") Some(0)
    else
      kind match {
        case Some(Keyword.THY_HEADING1) => Some(1)
        case Some(Keyword.THY_HEADING2) | Some(Keyword.PRF_HEADING2) => Some(2)
        case Some(Keyword.THY_HEADING3) | Some(Keyword.PRF_HEADING3) => Some(3)
        case Some(Keyword.THY_HEADING4) | Some(Keyword.PRF_HEADING4) => Some(4)
        case Some(k) if Keyword.theory(k) => Some(5)
        case _ => None
      }
  }
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   290
58743
c07a59140fee clarified tree root;
wenzelm
parents: 58706
diff changeset
   291
  /* Parse text into a nested document structure of blocks and atoms.

     The text is split into command spans; each span becomes a Command and is
     added as Document_Atom to the innermost open block.  A command with a
     heading level first closes all open blocks at the same or deeper level
     and then opens a new block of its own, so the heading command itself is
     the first atom of that block.
  */
  def parse_document(node_name: Document.Node.Name, text: CharSequence):
    List[Outer_Syntax.Document] =
  {
    /* stack of open blocks */

    type Body = mutable.ListBuffer[Outer_Syntax.Document]

    def fresh_body(): Body = new mutable.ListBuffer[Outer_Syntax.Document]

    // innermost block first; the bottom entry is the root (level 0, empty command)
    var open: List[(Int, Command, Body)] = List((0, Command.empty, fresh_body()))

    // Pop blocks while the innermost level satisfies the predicate, wrapping
    // each as Document_Block inside its parent.  The bottom entry is never
    // popped, because the pattern requires a parent entry.
    @tailrec def close_while(pred: Int => Boolean): Unit =
      open match {
        case (lev, cmd, inner) :: (parents @ ((_, _, outer) :: _)) if pred(lev) =>
          outer += Outer_Syntax.Document_Block(cmd.name, cmd.source, inner.toList)
          open = parents
          close_while(pred)
        case _ => ()
      }

    def add(command: Command): Unit =
    {
      for (i <- heading_level(command)) {
        // blocks are stored with level i + 1, thus "_ > i" also closes
        // blocks that were opened by a heading of the same level
        close_while(_ > i)
        open = (i + 1, command, fresh_body()) :: open
      }
      open.head._3 += Outer_Syntax.Document_Atom(command)
    }


    /* result structure */

    for (span <- parse_spans(text))
      add(Command(Document_ID.none, node_name, Nil, span))

    // close everything down to the root and return its content
    close_while(_ => true)
    open.head._3.toList
  }
34166
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
   337
}