src/Pure/Isar/outer_syntax.scala
author wenzelm
Mon, 11 Jul 2016 16:36:29 +0200
changeset 63441 4c3fa4dba79f
parent 63429 baedd4724f08
child 63458 723f9c673c1c
permissions -rw-r--r--
explicit kind "before_command"; tuned signature;
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
34166
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     1
/*  Title:      Pure/Isar/outer_syntax.scala
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     2
    Author:     Makarius
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     3
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     4
Isabelle/Isar outer syntax.
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     5
*/
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     6
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     7
package isabelle
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     8
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
     9
43411
0206466ee473 some support for partial scans with explicit context;
wenzelm
parents: 40533
diff changeset
    10
import scala.collection.mutable
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
    11
import scala.annotation.tailrec
34166
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
    12
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
    13
43774
6dfdb70496fe added Outer_Syntax.quote_string, which is conceptually a bit different from Token.unparse;
wenzelm
parents: 43695
diff changeset
    14
/**
 * Static part of the outer syntax: canonical syntax values, quoting of
 * string literals, and the data types for line and document structure.
 */
object Outer_Syntax
{
  /* syntax */

  // syntax built from all constructor defaults
  val empty: Outer_Syntax = new Outer_Syntax()

  // syntax whose completion table is Completion.init()
  def init(): Outer_Syntax = new Outer_Syntax(completion = Completion.init())


  /* string literals */

  /**
   * Enclose str in double quotes.  Symbols that consist of a single
   * character which is either below 32 (except YXML.X and YXML.Y), a
   * backslash, or a double quote are written as a backslash followed by the
   * three-digit decimal character code; all other symbols are copied as is.
   */
  def quote_string(str: String): String =
  {
    val result = new StringBuilder(str.length + 10)
    result += '"'
    for (s <- Symbol.iterator(str)) {
      if (s.length == 1) {
        val c = s(0)
        if (c < 32 && c != YXML.X && c != YXML.Y || c == '\\' || c == '"') {
          result += '\\'
          // zero-pad to three digits (every escaped code is below 100)
          if (c < 10) result += '0'
          if (c < 100) result += '0'
          result ++= c.toInt.toString
        }
        else result += c
      }
      else result ++= s
    }
    result += '"'
    result.toString
  }


  /* line-oriented structure */

  object Line_Structure
  {
    // initial state: all fields at their defaults
    val init: Line_Structure = Line_Structure()
  }

  // per-line state: two flags and three depth counters
  sealed case class Line_Structure(
    improper: Boolean = true,
    command: Boolean = false,
    depth: Int = 0,
    span_depth: Int = 0,
    after_span_depth: Int = 0)


  /* overall document structure */

  sealed abstract class Document { def length: Int }

  // inner node: its length is the sum of the lengths of its body
  case class Document_Block(name: String, text: String, body: List[Document]) extends Document
  {
    val length: Int = body.foldLeft(0)(_ + _.length)
  }

  // leaf node: its length is the length of the underlying command
  case class Document_Atom(command: Command) extends Document
  {
    def length: Int = command.length
  }
}
6dfdb70496fe added Outer_Syntax.quote_string, which is conceptually a bit different from Token.unparse;
wenzelm
parents: 43695
diff changeset
    74
46712
8650d9a95736 prefer final ADTs -- prevent ooddities;
wenzelm
parents: 46626
diff changeset
    75
final class Outer_Syntax private(
58900
1435cc20b022 explicit type Keyword.Keywords;
wenzelm
parents: 58899
diff changeset
    76
  val keywords: Keyword.Keywords = Keyword.Keywords.empty,
53280
c63a016805b9 explicit indication of outer syntax with no tokens;
wenzelm
parents: 52439
diff changeset
    77
  val completion: Completion = Completion.empty,
55749
75a48dc4383e tuned signature;
wenzelm
parents: 55666
diff changeset
    78
  val language_context: Completion.Language_Context = Completion.Language_Context.outer,
56393
22f533e6a049 more abstract Prover.Syntax, as proposed by Carst Tankink;
wenzelm
parents: 56314
diff changeset
    79
  val has_tokens: Boolean = true) extends Prover.Syntax
34166
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
    80
{
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
    81
  /** syntax content **/
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
    82
58900
1435cc20b022 explicit type Keyword.Keywords;
wenzelm
parents: 58899
diff changeset
    83
  // printed form is that of the keyword table
  override def toString: String = keywords.toString
56393
22f533e6a049 more abstract Prover.Syntax, as proposed by Carst Tankink;
wenzelm
parents: 56314
diff changeset
    84
58695
91839729224e tuned comments;
wenzelm
parents: 58694
diff changeset
    85
91839729224e tuned comments;
wenzelm
parents: 58694
diff changeset
    86
  /* add keywords */
91839729224e tuned comments;
wenzelm
parents: 58694
diff changeset
    87
63429
baedd4724f08 tuned signature: more uniform Keyword.spec;
wenzelm
parents: 63424
diff changeset
    88
  /**
   * Syntax extended by one keyword.  The keyword table receives
   * (name, kind, tags).  The completion table is left alone when replace is
   * Some(""); otherwise it receives name together with the given
   * replacement, or with name itself if replace is None.  The result always
   * has has_tokens = true.
   */
  def + (name: String, kind: String = "", tags: List[String] = Nil, replace: Option[String] = None)
    : Outer_Syntax =
  {
    val extended_keywords = keywords + (name, kind, tags)
    val extended_completion =
      replace match {
        case Some("") => completion
        case Some(replacement) => completion + (name, replacement)
        case None => completion + (name, name)
      }
    new Outer_Syntax(extended_keywords, extended_completion, language_context, true)
  }
48706
e2b512024eab tuned signature;
wenzelm
parents: 48671
diff changeset
    97
48873
18b17f15bc62 more direct cumulation of (sparse) keywords;
wenzelm
parents: 48872
diff changeset
    98
  /**
   * Add all given header keywords to this syntax.  Each entry is added
   * twice: once under Symbol.decode(name) and once under
   * Symbol.encode(name), with the same kind, tags and replacement.  The
   * second component of the keyword spec is ignored here.
   */
  def add_keywords(keywords: Thy_Header.Keywords): Outer_Syntax =
    keywords.foldLeft[Outer_Syntax](this) {
      case (syntax, (name, ((kind, tags), _), replace)) =>
        syntax +
          (Symbol.decode(name), kind, tags, replace) +
          (Symbol.encode(name), kind, tags, replace)
    }
34166
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
   105
58695
91839729224e tuned comments;
wenzelm
parents: 58694
diff changeset
   106
59073
dcecfcc56dce more merge operations;
wenzelm
parents: 58938
diff changeset
   107
  /* merge */
dcecfcc56dce more merge operations;
wenzelm
parents: 58938
diff changeset
   108
59077
7e0d3da6e6d8 node-specific syntax, with base_syntax as default;
wenzelm
parents: 59073
diff changeset
   109
  /**
   * Merge with another syntax, which is cast to Outer_Syntax.  Keyword and
   * completion tables are merged; language_context and has_tokens are taken
   * from this syntax.  Returns this very object if other is identical to it
   * or if merging leaves both tables physically unchanged.
   */
  def ++ (other: Prover.Syntax): Prover.Syntax =
    if (this eq other) this
    else {
      val that = other.asInstanceOf[Outer_Syntax]
      val merged_keywords = keywords ++ that.keywords
      val merged_completion = completion ++ that.completion
      val unchanged = (keywords eq merged_keywords) && (completion eq merged_completion)
      if (unchanged) this
      else new Outer_Syntax(merged_keywords, merged_completion, language_context, has_tokens)
    }
dcecfcc56dce more merge operations;
wenzelm
parents: 58938
diff changeset
   117
dcecfcc56dce more merge operations;
wenzelm
parents: 58938
diff changeset
   118
59735
24bee1b11fce misc tuning and simplification;
wenzelm
parents: 59702
diff changeset
   119
  /* load commands */
58900
1435cc20b022 explicit type Keyword.Keywords;
wenzelm
parents: 58899
diff changeset
   120
63441
4c3fa4dba79f explicit kind "before_command";
wenzelm
parents: 63429
diff changeset
   121
  // entry for name in keywords.load_commands, if any
  def load_command(name: String): Option[List[String]] = keywords.load_commands.get(name)
58900
1435cc20b022 explicit type Keyword.Keywords;
wenzelm
parents: 58899
diff changeset
   122
  // delegates to keywords.load_commands_in for the given text
  def load_commands_in(text: String): Boolean = keywords.load_commands_in(text)
1435cc20b022 explicit type Keyword.Keywords;
wenzelm
parents: 58899
diff changeset
   123
1435cc20b022 explicit type Keyword.Keywords;
wenzelm
parents: 58899
diff changeset
   124
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   125
  /* language context */
34166
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
   126
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   127
  // copy of this syntax with the given language context; other fields unchanged
  def set_language_context(context: Completion.Language_Context): Outer_Syntax =
    new Outer_Syntax(
      keywords = keywords,
      completion = completion,
      language_context = context,
      has_tokens = has_tokens)
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   129
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   130
  /**
   * Variant of this syntax with has_tokens = false and an empty keyword
   * table; completion and language context are retained.  Requires that the
   * keyword table of this syntax is empty.
   */
  def no_tokens: Outer_Syntax =
  {
    require(keywords.is_empty)
    new Outer_Syntax(Keyword.Keywords.empty, completion, language_context, false)
  }
40454
2516ea25a54b some support for nested source structure, based on section headings;
wenzelm
parents: 38471
diff changeset
   138
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   139
40454
2516ea25a54b some support for nested source structure, based on section headings;
wenzelm
parents: 38471
diff changeset
   140
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   141
  /** parsing **/
34166
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
   142
58697
5bc1d6c4a499 tuned signature;
wenzelm
parents: 58696
diff changeset
   143
  /* line-oriented structure */
58696
6b7445774ce3 more explicit Line_Nesting;
wenzelm
parents: 58695
diff changeset
   144
59924
801b979ec0c2 more general notion of command span: command keyword not necessarily at start;
wenzelm
parents: 59735
diff changeset
   145
  /**
   * Line structure for the given tokens, relative to an incoming structure
   * (presumably the result for the preceding line -- to be confirmed
   * against callers).
   *
   * The resulting depth is 0 if some token is a theory command, the
   * incoming after_span_depth if there is any other command token, and the
   * incoming span_depth otherwise.  The pair (span_depth, after_span_depth)
   * is threaded through all tokens and updated by each command token
   * according to its keyword kind.
   */
  def line_structure(tokens: List[Token], structure: Outer_Syntax.Line_Structure)
    : Outer_Syntax.Line_Structure =
  {
    val improper1 = tokens.forall(_.is_improper)
    val command1 = tokens.exists(_.is_command)

    val depth1 =
      if (tokens.exists(keywords.is_command(_, Keyword.theory))) 0
      else if (command1) structure.after_span_depth
      else structure.span_depth

    // x: span_depth, y: after_span_depth; the order of tests is significant
    val (span_depth1, after_span_depth1) =
      tokens.foldLeft((structure.span_depth, structure.after_span_depth)) {
        case ((x, y), tok) =>
          if (tok.is_command) {
            if (keywords.is_command(tok, Keyword.theory_goal)) (2, 1)
            else if (keywords.is_command(tok, Keyword.theory)) (1, 0)
            else if (keywords.is_command(tok, Keyword.proof_open)) (y + 2, y + 1)
            else if (keywords.is_command(tok, Keyword.PRF_BLOCK == _)) (y + 2, y + 1)
            else if (keywords.is_command(tok, Keyword.QED_BLOCK == _)) (y + 1, y - 2)
            else if (keywords.is_command(tok, Keyword.proof_close)) (y + 1, y - 1)
            else if (keywords.is_command(tok, Keyword.qed_global)) (1, 0)
            else (x, y)
          }
          else (x, y)
      }

    Outer_Syntax.Line_Structure(improper1, command1, depth1, span_depth1, after_span_depth1)
  }
6b7445774ce3 more explicit Line_Nesting;
wenzelm
parents: 58695
diff changeset
   174
6b7445774ce3 more explicit Line_Nesting;
wenzelm
parents: 58695
diff changeset
   175
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   176
  /* command spans */
57905
c0c5652e796e separate module Command_Span: mostly syntactic representation;
wenzelm
parents: 57901
diff changeset
   177
c0c5652e796e separate module Command_Span: mostly syntactic representation;
wenzelm
parents: 57901
diff changeset
   178
  /**
   * Partition a token list into command spans.
   *
   * Improper tokens are buffered separately.  A new span is started by a
   * "before_command" keyword, or by a command keyword unless the pending
   * content already holds a "before_command" token that has not yet been
   * followed by a command.  Any other proper token is appended to the
   * pending content, preceded by the improper tokens buffered so far.
   */
  def parse_spans(toks: List[Token]): List[Command_Span.Span] =
  {
    val result = new mutable.ListBuffer[Command_Span.Span]
    val content = new mutable.ListBuffer[Token]
    val improper = new mutable.ListBuffer[Token]

    // classify a finished span and append it to the result
    def ship(span: List[Token]): Unit =
    {
      val kind =
        if (span.forall(_.is_improper)) Command_Span.Ignored_Span
        else if (span.exists(_.is_error)) Command_Span.Malformed_Span
        else
          span.find(_.is_command) match {
            case None => Command_Span.Malformed_Span
            case Some(cmd) =>
              val name = cmd.source
              // number of symbols in the tokens that precede the command keyword
              val offset =
                span.takeWhile(_ != cmd).foldLeft(0) {
                  case (i, tok) => i + Symbol.iterator(tok.source).length }
              val end_offset = offset + Symbol.iterator(name).length
              val pos = Position.Range(Text.Range(offset, end_offset) + 1)
              Command_Span.Command_Span(name, pos)
          }
      result += Command_Span.Span(kind, span)
    }

    // emit pending content, then pending improper tokens, as separate spans
    def flush(): Unit =
    {
      if (content.nonEmpty) { ship(content.toList); content.clear() }
      if (improper.nonEmpty) { ship(improper.toList); improper.clear() }
    }

    for (tok <- toks) {
      if (tok.is_improper) improper += tok
      else if (keywords.is_before_command(tok) ||
        tok.is_command &&
          (!content.exists(keywords.is_before_command(_)) || content.exists(_.is_command)))
      { flush(); content += tok }
      else { content ++= improper; improper.clear(); content += tok }
    }
    flush()

    result.toList
  }
c0c5652e796e separate module Command_Span: mostly syntactic representation;
wenzelm
parents: 57901
diff changeset
   222
57906
020df63dd0a9 tuned signature;
wenzelm
parents: 57905
diff changeset
   223
  // tokenize the input wrt. the keywords of this syntax, then parse spans
  def parse_spans(input: CharSequence): List[Command_Span.Span] =
  {
    val toks = Token.explode(keywords, input)
    parse_spans(toks)
  }
57906
020df63dd0a9 tuned signature;
wenzelm
parents: 57905
diff changeset
   225
57905
c0c5652e796e separate module Command_Span: mostly syntactic representation;
wenzelm
parents: 57901
diff changeset
   226
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   227
  /* overall document structure */
55616
25a7a998852a default completion context via outer syntax;
wenzelm
parents: 55510
diff changeset
   228
58706
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   229
  /**
   * Heading level of a command: 0 to 5 for the fixed heading commands from
   * chapter down to subparagraph, 6 for any other command whose keyword
   * kind satisfies Keyword.theory but not Keyword.theory_end, None
   * otherwise.
   */
  def heading_level(command: Command): Option[Int] =
  {
    val command_name = command.span.name

    val fixed_levels =
      List(
        Thy_Header.CHAPTER -> 0,
        Thy_Header.SECTION -> 1,
        Thy_Header.SUBSECTION -> 2,
        Thy_Header.SUBSUBSECTION -> 3,
        Thy_Header.PARAGRAPH -> 4,
        Thy_Header.SUBPARAGRAPH -> 5)

    fixed_levels.collectFirst({ case (heading, level) if heading == command_name => level }) orElse
      keywords.kinds.get(command_name).collect({
        case kind if Keyword.theory(kind) && !Keyword.theory_end(kind) => 6
      })
  }
70a947611792 tuned signature and modules;
wenzelm
parents: 58703
diff changeset
   246
58743
c07a59140fee clarified tree root;
wenzelm
parents: 58706
diff changeset
   247
  // Parse text into a forest of document items, nested by heading level.
  //
  // Every span of the text becomes a Command, which is recorded as a
  // Document_Atom.  A command with a defined heading_level additionally
  // opens a new Document_Block, after all currently open blocks of the same
  // or a deeper level have been closed; the heading command itself is the
  // first atom of the block it opens.
  def parse_document(node_name: Document.Node.Name, text: CharSequence):
    List[Outer_Syntax.Document] =
  {
    type Body = mutable.ListBuffer[Outer_Syntax.Document]

    def new_body(): Body = new mutable.ListBuffer[Outer_Syntax.Document]


    /* stack operations */

    // Open blocks, innermost first: (stored level, opening command, items
    // collected so far).  The bottom entry is the root with level 0 and an
    // empty command; heading blocks are stored with heading level + 1.
    var stack: List[(Int, Command, Body)] =
      List((0, Command.empty, new_body()))

    // Pop open blocks while the stored level of the innermost one satisfies
    // the predicate, appending each finished block to its parent's items.
    // At least two entries are required, so the root is never popped.
    @tailrec def close(level: Int => Boolean): Unit =
      stack match {
        case (lev, command, body) :: (outer @ ((_, _, parent) :: _)) if level(lev) =>
          parent += Outer_Syntax.Document_Block(command.span.name, command.source, body.toList)
          stack = outer
          close(level)
        case _ =>
      }

    // Close everything that is still open and return the root's items.
    def result(): List[Outer_Syntax.Document] =
    {
      close(_ => true)
      val (_, _, root) = stack.head
      root.toList
    }

    // Record one command, opening a new block first if it is a heading.
    def add(command: Command): Unit =
    {
      for (i <- heading_level(command)) {
        close(lev => lev > i)
        stack = (i + 1, command, new_body()) :: stack
      }
      val (_, _, current) = stack.head
      current += Outer_Syntax.Document_Atom(command)
    }


    /* result structure */

    for (span <- parse_spans(text))
      add(Command(Document_ID.none, node_name, Command.no_blobs, span))

    result()
  }
34166
446a33b874b3 renamed class Outer_Keyword to Outer_Syntax;
wenzelm
parents:
diff changeset
   293
}