src/Pure/PIDE/xml.scala
author wenzelm
Sat, 07 Sep 2013 17:32:55 +0200
changeset 53461 26c609ada983
parent 52890 36e2c0c308eb
child 55618 995162143ef4
permissions -rw-r--r--
clarified modules;
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
44698
0385292321a0 moved XML/YXML to src/Pure/PIDE;
wenzelm
parents: 44697
diff changeset
     1
/*  Title:      Pure/PIDE/xml.scala
45673
cd41e3903fbf separate compilation of PIDE vs. Pure sources, which enables independent Scala library;
wenzelm
parents: 45667
diff changeset
     2
    Module:     PIDE
27931
b533a9de87a7 Minimalistic XML tree values.
wenzelm
parents:
diff changeset
     3
    Author:     Makarius
b533a9de87a7 Minimalistic XML tree values.
wenzelm
parents:
diff changeset
     4
44698
0385292321a0 moved XML/YXML to src/Pure/PIDE;
wenzelm
parents: 44697
diff changeset
     5
Untyped XML trees and basic data representation.
27931
b533a9de87a7 Minimalistic XML tree values.
wenzelm
parents:
diff changeset
     6
*/
b533a9de87a7 Minimalistic XML tree values.
wenzelm
parents:
diff changeset
     7
b533a9de87a7 Minimalistic XML tree values.
wenzelm
parents:
diff changeset
     8
package isabelle
b533a9de87a7 Minimalistic XML tree values.
wenzelm
parents:
diff changeset
     9
34108
54d48ca8708f cache for partial sharing;
wenzelm
parents: 34047
diff changeset
    10
import java.util.WeakHashMap
54d48ca8708f cache for partial sharing;
wenzelm
parents: 34047
diff changeset
    11
import java.lang.ref.WeakReference
54d48ca8708f cache for partial sharing;
wenzelm
parents: 34047
diff changeset
    12
import javax.xml.parsers.DocumentBuilderFactory
54d48ca8708f cache for partial sharing;
wenzelm
parents: 34047
diff changeset
    13
27947
b6dc0a396857 tuned comments;
wenzelm
parents: 27942
diff changeset
    14
29203
0c4effb73518 override toString method;
wenzelm
parents: 29140
diff changeset
    15
object XML
0c4effb73518 override toString method;
wenzelm
parents: 29140
diff changeset
    16
{
43767
e0219ef7f84c tuned XML modules;
wenzelm
parents: 43747
diff changeset
    17
  /** XML trees **/
e0219ef7f84c tuned XML modules;
wenzelm
parents: 43747
diff changeset
    18
27947
b6dc0a396857 tuned comments;
wenzelm
parents: 27942
diff changeset
    19
  /* datatype representation */
b6dc0a396857 tuned comments;
wenzelm
parents: 27942
diff changeset
    20
43780
2cb2310d68b6 more uniform Properties in ML and Scala;
wenzelm
parents: 43778
diff changeset
    21
  /* alias: XML attributes are represented as Properties.T */
  type Attributes = Properties.T
27931
b533a9de87a7 Minimalistic XML tree values.
wenzelm
parents:
diff changeset
    22
38268
beb86b805590 more uniform XML/YXML string_of_body/string_of_tree;
wenzelm
parents: 38267
diff changeset
    23
  /* closed hierarchy of tree nodes: Elem or Text; printing goes through string_of_tree */
  sealed abstract class Tree
  {
    override def toString: String = string_of_tree(this)
  }

  /* element node: markup plus list of child trees */
  case class Elem(markup: Markup, body: List[Tree]) extends Tree
  {
    /* shortcut for the name of the element's markup */
    def name: String = markup.name
  }

  /* text node holding a plain string */
  case class Text(content: String) extends Tree
29203
0c4effb73518 override toString method;
wenzelm
parents: 29140
diff changeset
    29
38230
ed147003de4b simplified type XML.Tree: embed Markup directly, avoid slightly odd triple;
wenzelm
parents: 36817
diff changeset
    30
  /* element with the given name, no properties, and the given body */
  def elem(name: String, body: List[Tree]): Elem = Elem(markup = Markup(name, Nil), body = body)
ed147003de4b simplified type XML.Tree: embed Markup directly, avoid slightly odd triple;
wenzelm
parents: 36817
diff changeset
    31
  /* element with the given name, no properties, and an empty body */
  def elem(name: String): Elem = Elem(markup = Markup(name, Nil), body = Nil)
33999
d3b200894e21 added auxiliary constructors;
wenzelm
parents: 33953
diff changeset
    32
38267
e50c283dd125 type XML.Body as basic data representation language (Scala version);
wenzelm
parents: 38263
diff changeset
    33
  /* a body is a plain list of trees */
  type Body = List[Tree]
e50c283dd125 type XML.Body as basic data representation language (Scala version);
wenzelm
parents: 38263
diff changeset
    34
29203
0c4effb73518 override toString method;
wenzelm
parents: 29140
diff changeset
    35
49650
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    36
  /* wrapped elements */
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    37
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    38
  /* reserved names used by Wrapped_Elem: wrapper element, name property, inner body element */
  val XML_ELEM = "xml_elem"
  val XML_NAME = "xml_name"
  val XML_BODY = "xml_body"
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    41
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    42
  /* Constructor/extractor for wrapped elements: the original markup name is kept as
     the leading XML_NAME property of an XML_ELEM element, body1 is nested inside a
     leading XML_BODY child, and body2 follows as the remaining children. */
  object Wrapped_Elem
  {
    /* build the wrapped form of (markup, body1, body2) */
    def apply(markup: Markup, body1: Body, body2: Body): XML.Elem =
    {
      val wrapper = Markup(XML_ELEM, (XML_NAME, markup.name) :: markup.properties)
      val inner = Elem(Markup(XML_BODY, Nil), body1)
      Elem(wrapper, inner :: body2)
    }

    /* recover (markup, body1, body2) from a tree of exactly the shape produced by apply */
    def unapply(tree: Tree): Option[(Markup, Body, Body)] =
      tree match {
        case Elem(
            Markup(XML_ELEM, (XML_NAME, name) :: props),
            Elem(Markup(XML_BODY, Nil), inner) :: outer) =>
          Some((Markup(name, props), inner, outer))
        case _ => None
      }
  }
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    57
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    58
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    59
  /* traverse text */
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    60
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    61
  /* Left-to-right fold of op over all text nodes of body, starting from a.
     For a wrapped element only its second body is visited; the nested XML_BODY
     part is skipped. */
  def traverse_text[A](body: Body)(a: A)(op: (A, String) => A): A =
  {
    def visit(acc: A, t: Tree): A =
      t match {
        case Text(s) => op(acc, s)
        // must precede the generic Elem case, since a wrapped element is an Elem too
        case Wrapped_Elem(_, _, ts) => ts.foldLeft(acc)(visit)
        case Elem(_, ts) => ts.foldLeft(acc)(visit)
      }
    body.foldLeft(a)(visit)
  }
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    71
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    72
  /* total number of characters over all text nodes visited by traverse_text */
  def text_length(body: Body): Int = traverse_text(body)(0)((total, s) => total + s.length)
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    73
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    74
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    75
  /* text content */
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    76
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    77
  /* concatenation of all text nodes visited by traverse_text, in traversal order */
  def content(body: Body): String =
  {
    // pre-size the buffer with the exact text length, then thread it through the fold
    val buffer = new StringBuilder(text_length(body))
    traverse_text(body)(buffer)((sb, s) => sb.append(s)).toString
  }
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    83
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    84
  /* text content of a single tree, via the body version */
  def content(tree: Tree): String = content(tree :: Nil)
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    85
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    86
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    87
9fad6480300d support for wrapped XML elements, which allows to preserve full markup tree information in to_XML/from_XML conversion;
wenzelm
parents: 49613
diff changeset
    88
  /** string representation **/
29203
0c4effb73518 override toString method;
wenzelm
parents: 29140
diff changeset
    89
38268
beb86b805590 more uniform XML/YXML string_of_body/string_of_tree;
wenzelm
parents: 38267
diff changeset
    90
  /* Render a body as XML text: elements with empty body are printed as <name .../>,
     other elements as <name ...>children</name>; text and attribute values are
     escaped. */
  def string_of_body(body: Body): String =
  {
    val out = new StringBuilder

    // Append txt with the characters < > & " ' replaced by entities.
    // A null string is handed to the builder as-is (presumably rendered as "null").
    def escaped(txt: String): Unit =
    {
      if (txt == null) out ++= txt
      else
        txt.foreach {
          case '<' => out ++= "&lt;"
          case '>' => out ++= "&gt;"
          case '&' => out ++= "&amp;"
          case '"' => out ++= "&quot;"
          case '\'' => out ++= "&apos;"
          case c => out += c
        }
    }

    // one attribute:  name="escaped value"  with a leading blank
    def attribute(p: (String, String)): Unit =
    {
      out ++= " "
      out ++= p._1
      out ++= "=\""
      escaped(p._2)
      out ++= "\""
    }

    // element name followed by all its attributes (without angle brackets)
    def tag_content(markup: Markup): Unit =
    {
      out ++= markup.name
      markup.properties.foreach(attribute)
    }

    def render(t: Tree): Unit =
      t match {
        case Text(txt) => escaped(txt)
        case Elem(markup, Nil) =>
          out ++= "<"
          tag_content(markup)
          out ++= "/>"
        case Elem(markup, ts) =>
          out ++= "<"
          tag_content(markup)
          out ++= ">"
          ts.foreach(render)
          out ++= "</"
          out ++= markup.name
          out ++= ">"
      }

    body.foreach(render)
    out.toString
  }
0c4effb73518 override toString method;
wenzelm
parents: 29140
diff changeset
   122
38268
beb86b805590 more uniform XML/YXML string_of_body/string_of_tree;
wenzelm
parents: 38267
diff changeset
   123
  /* XML text of a single tree, via the body version */
  def string_of_tree(tree: XML.Tree): String = string_of_body(tree :: Nil)
27941
b4656b671cce added iterator over content;
wenzelm
parents: 27931
diff changeset
   124
b4656b671cce added iterator over content;
wenzelm
parents: 27931
diff changeset
   125
44808
05b8997899a2 XML.cache for partial sharing (strings only);
wenzelm
parents: 44721
diff changeset
   126
05b8997899a2 XML.cache for partial sharing (strings only);
wenzelm
parents: 44721
diff changeset
   127
  /** cache for partial sharing (weak table) **/
34108
54d48ca8708f cache for partial sharing;
wenzelm
parents: 34047
diff changeset
   128
43745
562e35bc351e tuned XML.Cache parameters;
wenzelm
parents: 43520
diff changeset
   129
  /* Cache for partial sharing of strings, properties, markup and trees, backed by
     a weak table.  The public methods are synchronized on the cache instance.

     initial_size: initial capacity of the underlying WeakHashMap
     max_string:   strings longer than this are copied but never stored */
  class Cache(initial_size: Int = 131071, max_string: Int = 100)
  {
    // The table reference is never reassigned.  Each value is a WeakReference to its
    // own key: a WeakHashMap holds values strongly, so storing the key directly as
    // value would keep the entry alive forever.
    private val table = new WeakHashMap[Any, WeakReference[Any]](initial_size)

    /* shared representative equal to x, if one is still present in the table */
    private def lookup[A](x: A): Option[A] =
      for {
        ref <- Option(table.get(x))   // null if there is no entry
        y <- Option(ref.get)          // null if the referent was already cleared
      } yield y.asInstanceOf[A]       // store puts x itself as referent, so it is equal to x

    /* register x as its own representative and return it */
    private def store[A](x: A): A =
    {
      table.put(x, new WeakReference[Any](x))
      x
    }

    // fresh copy of the characters -- presumably to drop any larger shared backing array
    private def trim_bytes(s: String): String = new String(s.toCharArray)

    private def cache_string(x: String): String =
      lookup(x).getOrElse {
        val z = trim_bytes(x)
        // long strings are returned as a fresh copy but not kept in the table
        if (z.length > max_string) z else store(z)
      }

    private def cache_props(x: Properties.T): Properties.T =
      if (x.isEmpty) x
      else
        lookup(x).getOrElse(
          // property names are interned, property values go through the string cache
          store(x.map(p => (trim_bytes(p._1).intern, cache_string(p._2)))))

    private def cache_markup(x: Markup): Markup =
      lookup(x).getOrElse {
        x match {
          case Markup(name, props) =>
            store(Markup(cache_string(name), cache_props(props)))
        }
      }

    private def cache_tree(x: XML.Tree): XML.Tree =
      lookup(x).getOrElse {
        x match {
          case XML.Elem(markup, body) =>
            store(XML.Elem(cache_markup(markup), cache_body(body)))
          case XML.Text(text) => store(XML.Text(cache_string(text)))
        }
      }

    private def cache_body(x: XML.Body): XML.Body =
      if (x.isEmpty) x
      else
        // NOTE(review): the mapped list is not stored, so this lookup can only hit if
        // an equal list was stored by some other path -- confirm this is intended.
        lookup(x).getOrElse(x.map(cache_tree(_)))

    // main methods
    def string(x: String): String = synchronized { cache_string(x) }
    def props(x: Properties.T): Properties.T = synchronized { cache_props(x) }
    def markup(x: Markup): Markup = synchronized { cache_markup(x) }
    def tree(x: XML.Tree): XML.Tree = synchronized { cache_tree(x) }
    def body(x: XML.Body): XML.Body = synchronized { cache_body(x) }
    // cache_tree yields either a cached tree equal to x or a freshly stored Elem
    def elem(x: XML.Elem): XML.Elem = synchronized { cache_tree(x).asInstanceOf[XML.Elem] }
  }
54d48ca8708f cache for partial sharing;
wenzelm
parents: 34047
diff changeset
   200
54d48ca8708f cache for partial sharing;
wenzelm
parents: 34047
diff changeset
   201
43767
e0219ef7f84c tuned XML modules;
wenzelm
parents: 43747
diff changeset
   202
e0219ef7f84c tuned XML modules;
wenzelm
parents: 43747
diff changeset
   203
  /** XML as data representation language **/
e0219ef7f84c tuned XML modules;
wenzelm
parents: 43747
diff changeset
   204
51987
7d8e0e3c553b tuned signature;
wenzelm
parents: 51663
diff changeset
   205
  /* common base class of the XML data representation errors below; s is the exception message */
  abstract class Error(s: String) extends Exception(s)
7d8e0e3c553b tuned signature;
wenzelm
parents: 51663
diff changeset
   206
  /* error carrying the string s as its message */
  class XML_Atom(s: String) extends Error(s)
7d8e0e3c553b tuned signature;
wenzelm
parents: 51663
diff changeset
   207
  // Malformed XML body: thrown by the decoders when a body does not have the
  // expected shape.  The offending body is kept as a public member so that
  // handlers can inspect it; the exception message itself stays empty.
  class XML_Body(val body: XML.Body) extends Error("")
43767
e0219ef7f84c tuned XML modules;
wenzelm
parents: 43747
diff changeset
   208
e0219ef7f84c tuned XML modules;
wenzelm
parents: 43747
diff changeset
   209
  object Encode
  {
    // An encoder maps a value of type A to an XML body.
    type T[A] = A => XML.Body


    /* atomic values */

    // Decimal string of i.
    def long_atom(i: Long): String = i.toString

    // Decimal string of i.
    def int_atom(i: Int): String = i.toString

    // "1" for true, "0" for false.
    def bool_atom(b: Boolean): String = if (b) "1" else "0"

    // The unit value is represented by the empty string.
    def unit_atom(u: Unit): String = ""


    /* structural nodes */

    // Wrap a body into an element named ":" without attributes.
    private def node(ts: XML.Body): XML.Tree = XML.Elem(Markup(":", Nil), ts)

    // Attribute list whose names are the positions "0", "1", ... of the strings.
    private def vector(xs: List[String]): XML.Attributes =
      xs.zipWithIndex.map({ case (x, i) => (int_atom(i), x) })

    // Element named by the tag number, with the strings of data as positional
    // attributes and the body of data as content.
    private def tagged(tag: Int, data: (List[String], XML.Body)): XML.Tree =
    {
      val (atoms, content) = data
      XML.Elem(Markup(int_atom(tag), vector(atoms)), content)
    }


    /* representation of standard types */

    // Properties become the attributes of a single empty ":" element.
    val properties: T[Properties.T] =
      (props => List(XML.Elem(Markup(":", props), Nil)))

    // The empty string is the empty body; any other string is a single text node.
    val string: T[String] = (s => if (s.isEmpty) Nil else List(XML.Text(s)))

    val long: T[Long] = (x => string(long_atom(x)))

    val int: T[Int] = (x => string(int_atom(x)))

    val bool: T[Boolean] = (x => string(bool_atom(x)))

    val unit: T[Unit] = (x => string(unit_atom(x)))

    // Two nodes, one per component, in order.
    def pair[A, B](f: T[A], g: T[B]): T[(A, B)] =
      (x => List(node(f(x._1)), node(g(x._2))))

    // Three nodes, one per component, in order.
    def triple[A, B, C](f: T[A], g: T[B], h: T[C]): T[(A, B, C)] =
      (x => List(node(f(x._1)), node(g(x._2)), node(h(x._3))))

    // One node per list element.
    def list[A](f: T[A]): T[List[A]] =
      (xs => xs.map((x: A) => node(f(x))))

    // None is the empty body; Some(x) is a single node.
    def option[A](f: T[A]): T[Option[A]] =
    {
      case None => Nil
      case Some(x) => List(node(f(x)))
    }

    // Encode x with the first partial function of fs that is defined at x; its
    // position in fs becomes the tag of the resulting element.
    // Throws NoSuchElementException if no function of fs is defined at x.
    def variant[A](fs: List[PartialFunction[A, (List[String], XML.Body)]]): T[A] =
    {
      case x =>
        fs.iterator.zipWithIndex.find(p => p._1.isDefinedAt(x)) match {
          case Some((f, tag)) => List(tagged(tag, f(x)))
          case None =>
            // same exception type as the former Option.get, but with a usable message
            throw new NoSuchElementException("XML.Encode.variant: no matching case")
        }
    }
  }
e0219ef7f84c tuned XML modules;
wenzelm
parents: 43747
diff changeset
   273
e0219ef7f84c tuned XML modules;
wenzelm
parents: 43747
diff changeset
   274
  object Decode
  {
    // A decoder maps an XML body to a value of type A.
    type T[A] = XML.Body => A
    // A variant case decodes from positional strings plus a body.
    type V[A] = (List[String], XML.Body) => A


    /* atomic values */

    // Parse a decimal Long; XML_Atom(s) if s is not a number.
    def long_atom(s: String): Long =
      try { java.lang.Long.parseLong(s) }
      catch { case _: NumberFormatException => throw new XML_Atom(s) }

    // Parse a decimal Int; XML_Atom(s) if s is not a number.
    def int_atom(s: String): Int =
      try { Integer.parseInt(s) }
      catch { case _: NumberFormatException => throw new XML_Atom(s) }

    // "1" is true, "0" is false; anything else is XML_Atom(s).
    def bool_atom(s: String): Boolean =
      s match {
        case "1" => true
        case "0" => false
        case _ => throw new XML_Atom(s)
      }

    // Only the empty string denotes unit; anything else is XML_Atom(s).
    def unit_atom(s: String): Unit =
      if (s != "") throw new XML_Atom(s)


    /* structural nodes */

    // Unwrap an attribute-free ":" element; XML_Body for any other tree.
    private def node(t: XML.Tree): XML.Body =
      t match {
        case XML.Elem(Markup(":", Nil), content) => content
        case other => throw new XML_Body(List(other))
      }

    // Values of positional attributes: the name of the i-th attribute must be
    // the number i, otherwise XML_Atom with that name.
    private def vector(atts: XML.Attributes): List[String] =
    {
      val values =
        atts.iterator.zipWithIndex.map({ case ((name, value), pos) =>
          if (int_atom(name) != pos) throw new XML_Atom(name)
          value
        })
      values.toList
    }

    // Split an element into its numeric tag, positional strings and body;
    // XML_Body for a tree that is not an element.
    private def tagged(t: XML.Tree): (Int, (List[String], XML.Body)) =
      t match {
        case XML.Elem(Markup(name, atts), content) =>
          (int_atom(name), (vector(atts), content))
        case other => throw new XML_Body(List(other))
      }


    /* representation of standard types */

    // Attributes of a single empty ":" element.
    val properties: T[Properties.T] =
      (body =>
        body match {
          case List(XML.Elem(Markup(":", props), Nil)) => props
          case _ => throw new XML_Body(body)
        })

    // The empty body is the empty string; a single text node is its content.
    val string: T[String] =
      (body =>
        body match {
          case Nil => ""
          case List(XML.Text(s)) => s
          case _ => throw new XML_Body(body)
        })

    val long: T[Long] = (body => long_atom(string(body)))

    val int: T[Int] = (body => int_atom(string(body)))

    val bool: T[Boolean] = (body => bool_atom(string(body)))

    val unit: T[Unit] = (body => unit_atom(string(body)))

    // Exactly two nodes, decoded in order.
    def pair[A, B](f: T[A], g: T[B]): T[(A, B)] =
    {
      case List(t1, t2) =>
        val a = f(node(t1))
        val b = g(node(t2))
        (a, b)
      case ts => throw new XML_Body(ts)
    }

    // Exactly three nodes, decoded in order.
    def triple[A, B, C](f: T[A], g: T[B], h: T[C]): T[(A, B, C)] =
    {
      case List(t1, t2, t3) =>
        val a = f(node(t1))
        val b = g(node(t2))
        val c = h(node(t3))
        (a, b, c)
      case ts => throw new XML_Body(ts)
    }

    // One list element per node.
    def list[A](f: T[A]): T[List[A]] =
      (ts => for (t <- ts) yield f(node(t)))

    // The empty body is None; a single node is Some; anything else is XML_Body.
    def option[A](f: T[A]): T[Option[A]] =
    {
      case Nil => None
      case List(t) => Some(f(node(t)))
      case ts => throw new XML_Body(ts)
    }

    // Decode a single tagged element with the function of fs selected by the
    // tag number; XML_Body if the tag is out of range or the body is not a
    // single tree.
    def variant[A](fs: List[V[A]]): T[A] =
    {
      case List(t) =>
        val (tag, (xs, ts)) = tagged(t)
        fs.lift(tag) match {
          case Some(f) => f(xs, ts)
          case None => throw new XML_Body(List(t))
        }
      case ts => throw new XML_Body(ts)
    }
  }
27931
b533a9de87a7 Minimalistic XML tree values.
wenzelm
parents:
diff changeset
   374
}