src/Pure/Thy/thy_header.scala
author wenzelm
Wed, 01 Aug 2012 19:53:20 +0200
changeset 48638 22d65e375c01
parent 48484 70898d016538
child 48706 e2b512024eab
permissions -rw-r--r--
more standard bootstrapping of Pure.thy;
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
28495
c5f86d04743b Theory header keywords.
wenzelm
parents:
diff changeset
     1
/*  Title:      Pure/Thy/thy_header.scala
c5f86d04743b Theory header keywords.
wenzelm
parents:
diff changeset
     2
    Author:     Makarius
c5f86d04743b Theory header keywords.
wenzelm
parents:
diff changeset
     3
46939
5b67ac48b384 allow multiple 'keywords' as in 'fixes';
wenzelm
parents: 46938
diff changeset
     4
Static theory header information.
28495
c5f86d04743b Theory header keywords.
wenzelm
parents:
diff changeset
     5
*/
c5f86d04743b Theory header keywords.
wenzelm
parents:
diff changeset
     6
c5f86d04743b Theory header keywords.
wenzelm
parents:
diff changeset
     7
package isabelle
c5f86d04743b Theory header keywords.
wenzelm
parents:
diff changeset
     8
c5f86d04743b Theory header keywords.
wenzelm
parents:
diff changeset
     9
43611
21a57a0c5f25 more general theory header parsing;
wenzelm
parents: 41535
diff changeset
    10
import scala.annotation.tailrec
34169
7501b2910900 basic setup for header scanning/parsing;
wenzelm
parents: 32466
diff changeset
    11
import scala.collection.mutable
43646
598b2c6ce13f Thy_Header.read convenience;
wenzelm
parents: 43611
diff changeset
    12
import scala.util.parsing.input.{Reader, CharSequenceReader}
38149
3c380380beac somewhat uniform Thy_Header.split_thy_path in ML and Scala;
wenzelm
parents: 36956
diff changeset
    13
import scala.util.matching.Regex
34169
7501b2910900 basic setup for header scanning/parsing;
wenzelm
parents: 32466
diff changeset
    14
48409
0d2114eb412a more explicit java.io.{File => JFile};
wenzelm
parents: 46943
diff changeset
    15
import java.io.{File => JFile}
34188
fbfc18be1f8c scan: operate on file (via Scan.byte_reader), more robust exception handling;
wenzelm
parents: 34169
diff changeset
    16
34169
7501b2910900 basic setup for header scanning/parsing;
wenzelm
parents: 32466
diff changeset
    17
43661
39fdbd814c7f quasi-static Isabelle_System -- reduced tendency towards "functorial style";
wenzelm
parents: 43652
diff changeset
    18
object Thy_Header extends Parse.Parser
32450
375db037f4d2 misc tuning;
wenzelm
parents: 29140
diff changeset
    19
{
28495
c5f86d04743b Theory header keywords.
wenzelm
parents:
diff changeset
    20
  // Keywords of the theory header language; each one is also registered
  // in the private lexicon below.
  val HEADER: String = "header"
  val THEORY: String = "theory"
  val IMPORTS: String = "imports"
  val KEYWORDS: String = "keywords"
  val AND: String = "and"
  val USES: String = "uses"
  val BEGIN: String = "begin"

  // Minimal lexicon used for scanning a header: punctuation first, then the
  // keywords above.
  private val lexicon =
    Scan.Lexicon(
      "%", "(", ")", "::", ";",
      AND, BEGIN, HEADER, IMPORTS, KEYWORDS, THEORY, USES)
34190
dfcf667bbfed read header by scanning/parsing file;
wenzelm
parents: 34188
diff changeset
    30
38149
3c380380beac somewhat uniform Thy_Header.split_thy_path in ML and Scala;
wenzelm
parents: 36956
diff changeset
    31
44160
8848867501fb clarified document model header: master_dir (native wrt. editor, potentially URL) and node_name (full canonical path);
wenzelm
parents: 44159
diff changeset
    32
  /* theory file name */
8848867501fb clarified document model header: master_dir (native wrt. editor, potentially URL) and node_name (full canonical path);
wenzelm
parents: 44159
diff changeset
    33
44225
a8f921e6484f more robust Thy_Header.base_name, with minimal assumptions about path syntax;
wenzelm
parents: 44222
diff changeset
    34
  // Both patterns capture the last path component, i.e. the longest trailing
  // run of characters that contains none of '/', '\' or ':'.
  // Thy_Name additionally requires (and strips) a ".thy" suffix.
  private val Base_Name: Regex = """.*?([^/\\:]+)""".r
  private val Thy_Name: Regex = """.*?([^/\\:]+)\.thy""".r
44160
8848867501fb clarified document model header: master_dir (native wrt. editor, potentially URL) and node_name (full canonical path);
wenzelm
parents: 44159
diff changeset
    36
44225
a8f921e6484f more robust Thy_Header.base_name, with minimal assumptions about path syntax;
wenzelm
parents: 44222
diff changeset
    37
  // Last path component of s (after the final '/', '\' or ':').
  // Raises an error if s has no such non-empty trailing component.
  def base_name(s: String): String =
    s match {
      case Base_Name(base) => base
      case _ => error("Malformed import: " + quote(s))
    }
a8f921e6484f more robust Thy_Header.base_name, with minimal assumptions about path syntax;
wenzelm
parents: 44222
diff changeset
    39
44222
9d5ef6cd4ee1 use full .thy file name as node name, which makes MiscUtilities.resolveSymlinks/File.getCanonicalPath more predictable;
wenzelm
parents: 44185
diff changeset
    40
  // Theory name of a ".thy" file path: the last path component without the
  // ".thy" suffix, or None if s does not have that form.
  def thy_name(s: String): Option[String] =
    s match {
      case Thy_Name(thy) => Some(thy)
      case _ => None
    }
38149
3c380380beac somewhat uniform Thy_Header.split_thy_path in ML and Scala;
wenzelm
parents: 36956
diff changeset
    42
34169
7501b2910900 basic setup for header scanning/parsing;
wenzelm
parents: 32466
diff changeset
    43
7501b2910900 basic setup for header scanning/parsing;
wenzelm
parents: 32466
diff changeset
    44
  /* header */
7501b2910900 basic setup for header scanning/parsing;
wenzelm
parents: 32466
diff changeset
    45
44159
9a35e88d9dc9 simplified class Thy_Header;
wenzelm
parents: 44157
diff changeset
    46
  // Parser for a theory header, in one of two forms:
  //
  //   header <tags> <doc_source> ;* theory <tags> <args>
  //   theory <tags> <args>
  //
  // where <args> is
  //
  //   <theory_name> [imports <theory_name>+] [keywords <decls>] [uses <file>+] begin
  //
  // NOTE(review): atom, keyword, tags, string, doc_source and theory_name are
  // not defined in this file; presumably they are inherited from Parse.Parser.
  val header: Parser[Thy_Header] =
  {
    val file_name = atom("file name", _.is_name)

    /* 'keywords' section */

    val keyword_kind =
      atom("outer syntax keyword kind", _.is_name) ~ tags ^^
      { case kind ~ kind_tags => (kind, kind_tags) }

    // ":: kind" suffix; committed (~!) once "::" has been consumed
    val kind_spec = keyword("::") ~! keyword_kind ^^ { case _ ~ kind => kind }

    // one or more names sharing the same optional kind
    val keyword_decl =
      rep1(string) ~ opt(kind_spec) ^^
      { case names ~ kind => names.map(name => (name, kind)) }

    val more_keyword_decls =
      rep(keyword(AND) ~! keyword_decl ^^ { case _ ~ decl => decl })

    // declarations separated by 'and', flattened into a single list
    val keyword_decls =
      keyword_decl ~ more_keyword_decls ^^
      { case first ~ others => first ::: others.flatten }

    /* 'uses' section */

    // A file name in parentheses is paired with false, a bare one with true.
    // NOTE(review): the meaning of this flag is not visible here -- confirm
    // against the consumers of Thy_Header.uses.
    val bracketed_file =
      keyword("(") ~! (file_name ~ keyword(")")) ^^ { case _ ~ (path ~ _) => (path, false) }
    val plain_file = file_name ^^ (path => (path, true))
    val file = bracketed_file | plain_file

    /* optional sections: an absent section yields Nil */

    val imports_section =
      opt(keyword(IMPORTS) ~! rep1(theory_name)) ^^
      { case Some(_ ~ names) => names case None => Nil }

    val keywords_section =
      opt(keyword(KEYWORDS) ~! keyword_decls) ^^
      { case Some(_ ~ decls) => decls case None => Nil }

    val uses_section =
      opt(keyword(USES) ~! rep1(file)) ^^
      { case Some(_ ~ files) => files case None => Nil }

    val args =
      theory_name ~ imports_section ~ keywords_section ~ uses_section ~ keyword(BEGIN) ^^
      { case name ~ imports ~ keywords ~ uses ~ _ => Thy_Header(name, imports, keywords, uses) }

    /* the two admissible header forms */

    val with_doc_header =
      (keyword(HEADER) ~ tags) ~!
        ((doc_source ~ rep(keyword(";")) ~ keyword(THEORY) ~ tags) ~> args) ^^
      { case _ ~ thy => thy }

    val plain_theory =
      (keyword(THEORY) ~ tags) ~! args ^^ { case _ ~ thy => thy }

    with_doc_header | plain_theory
  }
7501b2910900 basic setup for header scanning/parsing;
wenzelm
parents: 32466
diff changeset
    75
7501b2910900 basic setup for header scanning/parsing;
wenzelm
parents: 32466
diff changeset
    76
34190
dfcf667bbfed read header by scanning/parsing file;
wenzelm
parents: 34188
diff changeset
    77
  /* read -- lazy scanning */
34169
7501b2910900 basic setup for header scanning/parsing;
wenzelm
parents: 32466
diff changeset
    78
44159
9a35e88d9dc9 simplified class Thy_Header;
wenzelm
parents: 44157
diff changeset
    79
  // Read a theory header from a character reader.  Tokens are scanned only up
  // to and including the first token for which is_begin holds (or until the
  // scanner no longer succeeds); the collected tokens are then parsed with
  // the header parser.  A parse failure is raised as an error carrying the
  // printed parse result.
  def read(reader: Reader[Char]): Thy_Header =
  {
    val scan_token = lexicon.token(_ => false)
    val buffer = new mutable.ListBuffer[Token]

    @tailrec def collect_tokens(input: Reader[Char]): Unit =
      scan_token(input) match {
        case lexicon.Success(tok, rest) =>
          buffer += tok
          if (!tok.is_begin) collect_tokens(rest)
        case _ => ()  // scanner stopped: parse whatever was collected so far
      }
    collect_tokens(reader)

    val outcome = parse(commit(header), Token.reader(buffer.toList))
    outcome match {
      case Success(thy_header, _) => thy_header
      case other => error(other.toString)
    }
  }
43611
21a57a0c5f25 more general theory header parsing;
wenzelm
parents: 41535
diff changeset
   100
44159
9a35e88d9dc9 simplified class Thy_Header;
wenzelm
parents: 44157
diff changeset
   101
  // Convenience: read a theory header from in-memory text by wrapping it in a
  // CharSequenceReader and delegating to the Reader[Char] variant.
  def read(source: CharSequence): Thy_Header =
  {
    val chars: Reader[Char] = new CharSequenceReader(source)
    read(chars)
  }
598b2c6ce13f Thy_Header.read convenience;
wenzelm
parents: 43611
diff changeset
   103
48409
0d2114eb412a more explicit java.io.{File => JFile};
wenzelm
parents: 46943
diff changeset
   104
  // Read a theory header from a file via Scan.byte_reader.  All strings of
  // the resulting header are passed through
  // Standard_System.decode_permissive_utf8; the reader is closed in any case.
  def read(file: JFile): Thy_Header =
  {
    val bytes = Scan.byte_reader(file)
    try {
      val raw_header = read(bytes)
      raw_header.map(Standard_System.decode_permissive_utf8)
    }
    finally { bytes.close }
  }
34169
7501b2910900 basic setup for header scanning/parsing;
wenzelm
parents: 32466
diff changeset
   110
}
44159
9a35e88d9dc9 simplified class Thy_Header;
wenzelm
parents: 44157
diff changeset
   111
9a35e88d9dc9 simplified class Thy_Header;
wenzelm
parents: 44157
diff changeset
   112
44185
05641edb5d30 provide node header via Scala layer;
wenzelm
parents: 44163
diff changeset
   113
// Static content of a theory header: theory name, imported theories,
// outer syntax keyword declarations, and used files (each paired with a
// Boolean flag as produced by the header parser).
sealed case class Thy_Header(
  name: String,
  imports: List[String],
  keywords: List[Outer_Syntax.Decl],
  uses: List[(String, Boolean)])
{
  // Apply f to the theory name, to every import and to every used file name;
  // keyword declarations and the file flags are carried over unchanged.
  def map(f: String => String): Thy_Header =
  {
    val mapped_name = f(name)
    val mapped_imports = imports.map(f)
    val mapped_uses = uses.map({ case (path, flag) => (f(path), flag) })
    Thy_Header(mapped_name, mapped_imports, keywords, mapped_uses)
  }
}
9a35e88d9dc9 simplified class Thy_Header;
wenzelm
parents: 44157
diff changeset
   121