src/Pure/Thy/thy_syntax.scala
author wenzelm
Wed Nov 10 15:42:20 2010 +0100 (2010-11-10)
changeset 40457 3b0050718b31
parent 40454 2516ea25a54b
child 40478 4bae781b8f7c
permissions -rw-r--r--
proper treatment of equal heading level;
wenzelm@34268
     1
/*  Title:      Pure/Thy/thy_syntax.scala
wenzelm@34268
     2
    Author:     Makarius
wenzelm@34268
     3
wenzelm@38374
     4
Superficial theory syntax: tokens and spans.
wenzelm@34268
     5
*/
wenzelm@34268
     6
wenzelm@34268
     7
package isabelle
wenzelm@34268
     8
wenzelm@34268
     9
wenzelm@38239
    10
import scala.collection.mutable
wenzelm@38374
    11
import scala.annotation.tailrec
wenzelm@38239
    12
wenzelm@38239
    13
wenzelm@34303
    14
object Thy_Syntax
wenzelm@34268
    15
{
wenzelm@40454
    16
  /** nested structure **/
wenzelm@40454
    17
wenzelm@40454
    18
  object Structure
wenzelm@40454
    19
  {
wenzelm@40454
    20
    /** Common base of all structure entries: every entry reports a length. */
    sealed abstract class Entry { def length: Int }
wenzelm@40454
    24
    /**
     * Named group of entries.
     *
     * The length is computed once at construction time as the sum of the
     * lengths of all body entries (0 for an empty body).
     */
    case class Block(val name: String, val body: List[Entry]) extends Entry
    {
      val length: Int = body.foldLeft(0)((total, entry) => total + entry.length)
    }
wenzelm@40454
    28
    /** Leaf entry wrapping a single command; its length is the length of that command. */
    case class Atom(val command: Command) extends Entry { def length: Int = command.length }
wenzelm@40454
    32
wenzelm@40454
    33
    /**
     * Parse `text` into a tree of nested sections.
     *
     * The text is scanned with `syntax` and split into command spans; every
     * command becomes an `Atom`.  A command for which `syntax.heading_level`
     * yields `Some(level)` first closes all open blocks whose level is greater
     * than or equal to `level`, then opens a new `Block` named by the command
     * source; the heading command itself becomes the first entry of that block.
     *
     * @param syntax     provides `scan` and `heading_level`
     * @param root_name  name of the outermost block (opened at level 0)
     * @param text       source text to be parsed
     * @return           the outermost block, containing all other entries
     */
    def parse_sections(syntax: Outer_Syntax, root_name: String, text: CharSequence): Entry =
    {
      /* stack of open blocks: (heading level, block name, entries collected so far) */

      type Frame = (Int, String, mutable.ListBuffer[Entry])

      def new_frame(level: Int, name: String): Frame =
        (level, name, new mutable.ListBuffer[Entry])

      var open_frames: List[Frame] = List(new_frame(0, root_name))

      // Pop frames from the top while the predicate accepts their level; each
      // popped frame is appended as Block to its parent.  The bottom frame is
      // never popped, because a parent frame is required.
      def close_while(should_close: Int => Boolean): Unit =
      {
        var done = false
        while (!done) {
          open_frames match {
            case (level, name, entries) :: (_, _, parent_entries) :: _ if should_close(level) =>
              parent_entries += Block(name, entries.toList)
              open_frames = open_frames.tail
            case _ => done = true
          }
        }
      }

      def add(command: Command): Unit =
      {
        for (heading <- syntax.heading_level(command)) {
          close_while(level => level >= heading)
          open_frames = new_frame(heading, command.source) :: open_frames
        }
        val (_, _, current_entries) = open_frames.head
        current_entries += Atom(command)
      }


      /* result structure */

      for (span <- parse_spans(syntax.scan(text))) add(Command.span(span))

      // close everything that is still open, leaving only the root frame
      close_while(_ => true)
      val (_, name, entries) = open_frames.head
      Block(name, entries.toList)
    }
wenzelm@40454
    76
  }
wenzelm@40454
    77
wenzelm@40454
    78
wenzelm@40454
    79
wenzelm@38374
    80
  /** parse spans **/
wenzelm@38374
    81
wenzelm@38373
    82
  /**
   * Split a token list into consecutive spans.
   *
   * A command token finishes the span collected so far and starts a new one.
   * Ignored tokens are held back: they are merged into the current span only
   * if a further non-command, non-ignored token follows; otherwise they are
   * emitted as a separate span of their own.  Empty spans are never emitted.
   *
   * @param toks  tokens in source order
   * @return      spans in source order
   */
  def parse_spans(toks: List[Token]): List[List[Token]] =
  {
    val finished = new mutable.ListBuffer[List[Token]]
    val current = new mutable.ListBuffer[Token]
    val pending_ignored = new mutable.ListBuffer[Token]

    // move the content of a non-empty buffer to the result and reset the buffer
    def emit(tokens: mutable.ListBuffer[Token]): Unit =
      if (tokens.nonEmpty) {
        finished += tokens.toList
        tokens.clear()
      }

    toks.foreach { tok =>
      if (tok.is_command) {
        emit(current)
        emit(pending_ignored)
        current += tok
      }
      else if (tok.is_ignored) pending_ignored += tok
      else {
        current ++= pending_ignored
        pending_ignored.clear()
        current += tok
      }
    }

    emit(current)
    emit(pending_ignored)
    finished.toList
  }
wenzelm@38374
   100
wenzelm@38374
   101
wenzelm@38374
   102
wenzelm@38374
   103
  /** text edits **/
wenzelm@38374
   104
wenzelm@38417
   105
  /**
   * Apply text edits to the nodes of a previous document version.
   *
   * For every edited node the command sequence is updated in two phases:
   * first the edits are applied to the sources of individual commands,
   * leaving unparsed commands behind; then the surroundings of each unparsed
   * command are re-scanned into proper command spans.  The difference between
   * old and new command sequence is reported as command edits.
   *
   * @param session   supplies the current syntax and fresh ids
   * @param previous  document version that the edits refer to
   * @param edits     text edits, paired with the name of the node they belong to
   * @return          command edits per node, together with the new version
   */
  def text_edits(session: Session, previous: Document.Version,
      edits: List[Document.Node_Text_Edit]): (List[Document.Edit[Command]], Document.Version) =
  {
    /* phase 1: edit individual command source */

    @tailrec def edit_text(eds: List[Text.Edit], commands: Linear_Set[Command])
        : Linear_Set[Command] =
      eds match {
        case Nil => commands

        case ed :: more =>
          // first command that either accepts the edit, or ends exactly
          // where the edit inserts its text
          val target =
            Document.Node.command_starts(commands.iterator).find {
              case (cmd, cmd_start) =>
                ed.can_edit(cmd.source, cmd_start) ||
                  ed.is_insert && ed.start == cmd_start + cmd.length
            }
          target match {
            case None =>
              // no command found: only an insert at offset 0 is acceptable
              require(ed.is_insert && ed.start == 0)
              edit_text(more, commands.insert_after(None, Command.unparsed(ed.text)))

            case Some((cmd, cmd_start)) =>
              if (ed.can_edit(cmd.source, cmd_start)) {
                // replace the command by an unparsed one holding the edited
                // source; whatever `edit` hands back is processed next
                val (leftover, new_source) = ed.edit(cmd.source, cmd_start)
                val replaced =
                  commands.insert_after(Some(cmd), Command.unparsed(new_source)) - cmd
                edit_text(leftover.toList ::: more, replaced)
              }
              else {
                // insert directly after the end of the command
                edit_text(more, commands.insert_after(Some(cmd), Command.unparsed(ed.text)))
              }
          }
      }


    /* phase 2: recover command spans */

    @tailrec def recover_spans(commands: Linear_Set[Command]): Linear_Set[Command] =
      commands.iterator.find(_.is_unparsed) match {
        case None => commands

        case Some(first_unparsed) =>
          // boundaries of the region to re-scan: in each direction, skip
          // commands without newlines, then take the next proper command
          // (or the very first / last command if there is none)
          val backward = commands.reverse_iterator(first_unparsed).dropWhile(_.newlines == 0)
          val first = backward.find(_.is_command).getOrElse(commands.head)
          val forward = commands.iterator(first_unparsed).dropWhile(_.newlines == 0)
          val last = forward.find(_.is_command).getOrElse(commands.last)

          val range =
            commands.iterator(first).takeWhile(cmd => cmd != last).toList ::: List(last)

          val source_text = (for (cmd <- range; tok <- cmd.span) yield tok.source).mkString
          val spans0 = parse_spans(session.current_syntax().scan(source_text))

          // keep the first command if re-scanning reproduced its span
          val keep_first = !spans0.isEmpty && first.is_command && first.span == spans0.head
          val before_edit = if (keep_first) Some(first) else commands.prev(first)
          val spans1 = if (keep_first) spans0.tail else spans0

          // likewise for the last command
          val keep_last = !spans1.isEmpty && last.is_command && last.span == spans1.last
          val after_edit = if (keep_last) Some(last) else commands.next(last)
          val spans2 = if (keep_last) spans1.dropRight(1) else spans1

          val inserted = for (span <- spans2) yield new Command(session.new_id(), span)
          recover_spans(
            commands.delete_between(before_edit, after_edit).append_after(before_edit, inserted))
      }


    /* resulting document edits */

    val doc_edits = new mutable.ListBuffer[Document.Edit[Command]]
    var nodes = previous.nodes

    for ((name, node_edits) <- edits) {
      val old_commands = nodes(name).commands
      val edited_commands = edit_text(node_edits, old_commands)
      val new_commands = recover_spans(edited_commands)   // FIXME somewhat slow

      val removed = old_commands.iterator.filter(cmd => !new_commands.contains(cmd)).toList
      val added = new_commands.iterator.filter(cmd => !old_commands.contains(cmd)).toList

      // removals (in reverse order) first, then insertions; each edit is
      // keyed by the predecessor of the command in its own sequence
      val cmd_edits =
        removed.reverse.map(cmd => (old_commands.prev(cmd), None)) :::
        added.map(cmd => (new_commands.prev(cmd), Some(cmd)))

      doc_edits += (name -> Some(cmd_edits))
      nodes += (name -> new Document.Node(new_commands))
    }

    (doc_edits.toList, new Document.Version(session.new_id(), nodes))
  }
wenzelm@34268
   199
}