src/Pure/Admin/build_log.scala
author wenzelm
Sat, 06 May 2017 12:52:29 +0200
changeset 65741 cf42659364c9
parent 65740 83388f09e9ab
child 65748 1f4a80e80c88
permissions -rw-r--r--
tuned;
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
64160
1eea419fab65 clarified files;
wenzelm
parents: 64155
diff changeset
     1
/*  Title:      Pure/Admin/build_log.scala
64045
c6160d0b0337 clarified modules;
wenzelm
parents:
diff changeset
     2
    Author:     Makarius
c6160d0b0337 clarified modules;
wenzelm
parents:
diff changeset
     3
65608
d526ba7b0a2d tuned comment;
wenzelm
parents: 65607
diff changeset
     4
Management of build log files and database storage.
64045
c6160d0b0337 clarified modules;
wenzelm
parents:
diff changeset
     5
*/
c6160d0b0337 clarified modules;
wenzelm
parents:
diff changeset
     6
c6160d0b0337 clarified modules;
wenzelm
parents:
diff changeset
     7
package isabelle
c6160d0b0337 clarified modules;
wenzelm
parents:
diff changeset
     8
c6160d0b0337 clarified modules;
wenzelm
parents:
diff changeset
     9
64100
9b1573213ebe tuned error;
wenzelm
parents: 64099
diff changeset
    10
import java.io.{File => JFile}
9b1573213ebe tuned error;
wenzelm
parents: 64099
diff changeset
    11
import java.time.ZoneId
64110
c0b96b34c7b9 support for Isabelle/Jenkins log file format;
wenzelm
parents: 64109
diff changeset
    12
import java.time.format.{DateTimeFormatter, DateTimeParseException}
64096
5edeb60a7ec5 more flexible date formats;
wenzelm
parents: 64095
diff changeset
    13
import java.util.Locale
64061
1bbea2b55d22 some support for header and data fields, notably from afp-test;
wenzelm
parents: 64054
diff changeset
    14
65600
138ffa41dc54 clarified filter_files: sorted and unique;
wenzelm
parents: 65599
diff changeset
    15
import scala.collection.immutable.SortedMap
64054
1fc9ab31720d clarified modules;
wenzelm
parents: 64053
diff changeset
    16
import scala.collection.mutable
1fc9ab31720d clarified modules;
wenzelm
parents: 64053
diff changeset
    17
import scala.util.matching.Regex
1fc9ab31720d clarified modules;
wenzelm
parents: 64053
diff changeset
    18
1fc9ab31720d clarified modules;
wenzelm
parents: 64053
diff changeset
    19
64045
c6160d0b0337 clarified modules;
wenzelm
parents:
diff changeset
    20
object Build_Log
c6160d0b0337 clarified modules;
wenzelm
parents:
diff changeset
    21
{
64298
wenzelm
parents: 64297
diff changeset
    22
  /** content **/
64101
976289c733e6 more formal directory content;
wenzelm
parents: 64100
diff changeset
    23
64298
wenzelm
parents: 64297
diff changeset
    24
  /* properties */
64150
b10f2ddd7679 clarified modules;
wenzelm
parents: 64120
diff changeset
    25
64298
wenzelm
parents: 64297
diff changeset
    26
  // Meta-information properties of a build, each declared as an SQL column
  // whose column name is the property name.
  object Prop
  {
    val build_tags = SQL.Column.string("build_tags")  // lines
    val build_args = SQL.Column.string("build_args")  // lines
    val build_group_id = SQL.Column.string("build_group_id")
    val build_id = SQL.Column.string("build_id")
    val build_engine = SQL.Column.string("build_engine")
    val build_host = SQL.Column.string("build_host")
    val build_start = SQL.Column.date("build_start")
    val build_end = SQL.Column.date("build_end")
    val isabelle_version = SQL.Column.string("isabelle_version")
    val afp_version = SQL.Column.string("afp_version")

    // all property columns, in declaration order
    val all_props: List[SQL.Column] =
      build_tags :: build_args :: build_group_id :: build_id :: build_engine ::
      build_host :: build_start :: build_end :: isabelle_version :: afp_version :: Nil
  }
64150
b10f2ddd7679 clarified modules;
wenzelm
parents: 64120
diff changeset
    43
b10f2ddd7679 clarified modules;
wenzelm
parents: 64120
diff changeset
    44
64298
wenzelm
parents: 64297
diff changeset
    45
  /* settings */
64080
2e5c0bd708af clarified modules;
wenzelm
parents: 64079
diff changeset
    46
64081
38bb09ed965b more uniform treatment of settings;
wenzelm
parents: 64080
diff changeset
    47
  // Settings recorded in build logs, each declared as an SQL column, plus
  // conversion between "NAME=value" lines and (name, value) entries.
  object Settings
  {
    val ISABELLE_BUILD_OPTIONS = SQL.Column.string("ISABELLE_BUILD_OPTIONS")
    val ML_PLATFORM = SQL.Column.string("ML_PLATFORM")
    val ML_HOME = SQL.Column.string("ML_HOME")
    val ML_SYSTEM = SQL.Column.string("ML_SYSTEM")
    val ML_OPTIONS = SQL.Column.string("ML_OPTIONS")

    val ml_settings = List(ML_PLATFORM, ML_HOME, ML_SYSTEM, ML_OPTIONS)
    val all_settings = ISABELLE_BUILD_OPTIONS :: ml_settings

    type Entry = (String, String)
    type T = List[Entry]

    object Entry
    {
      // Split a line at its first '='; the right-hand side goes through
      // Library.perhaps_unquote. A line without '=' yields None.
      def unapply(s: String): Option[Entry] =
      {
        val i = s.indexOf('=')
        if (i < 0) None
        else {
          val a = s.substring(0, i)
          val b = Library.perhaps_unquote(s.substring(i + 1))
          Some((a, b))
        }
      }

      // Render an entry as one line: name, '=', quoted value.
      def apply(a: String, b: String): String = a + "=" + quote(b)

      // Render the current value of setting a, as given by Isabelle_System.getenv.
      def getenv(a: String): String =
        apply(a, Isabelle_System.getenv(a))
    }

    // Current settings as text: the build options entry, an empty line,
    // then one entry per ML setting.
    def show(): String =
    {
      val build_options = Entry.getenv(ISABELLE_BUILD_OPTIONS.name)
      val ml_entries = ml_settings.map(c => Entry.getenv(c.name))
      cat_lines(build_options :: "" :: ml_entries)
    }
  }
2e5c0bd708af clarified modules;
wenzelm
parents: 64079
diff changeset
    80
2e5c0bd708af clarified modules;
wenzelm
parents: 64079
diff changeset
    81
64298
wenzelm
parents: 64297
diff changeset
    82
  /* file names */
wenzelm
parents: 64297
diff changeset
    83
wenzelm
parents: 64297
diff changeset
    84
  // Date stamp used in log file names: the day as "yyyy-MM-dd", a dot, then
  // the time elapsed since date.midnight in whole seconds (ms / 1000),
  // zero-padded to at least 5 digits.
  def log_date(date: Date): String =
  {
    val day = DateTimeFormatter.ofPattern("yyyy-MM-dd").format(date.rep)
    val seconds = (date.time - date.midnight.time).ms / 1000
    // String.format needs a boxed argument; use valueOf because the
    // java.lang.Long constructor is deprecated (since Java 9)
    String.format(Locale.ROOT, "%s.%05d", day, java.lang.Long.valueOf(seconds))
  }
wenzelm
parents: 64297
diff changeset
    88
wenzelm
parents: 64297
diff changeset
    89
  // Relative directory for logs of the given date: "log" followed by the year.
  def log_subdir(date: Date): Path =
  {
    val base = Path.explode("log")
    val year = Path.explode(date.rep.getYear.toString)
    base + year
  }
wenzelm
parents: 64297
diff changeset
    91
wenzelm
parents: 64297
diff changeset
    92
  // File name of a log: engine, date stamp and any further components,
  // joined by "_" and ending in ".log".
  def log_filename(engine: String, date: Date, more: List[String] = Nil): Path =
  {
    val components = engine :: log_date(date) :: more
    Path.explode(components.mkString("_") + ".log")
  }
wenzelm
parents: 64297
diff changeset
    94
wenzelm
parents: 64297
diff changeset
    95
64100
9b1573213ebe tuned error;
wenzelm
parents: 64099
diff changeset
    96
64062
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
    97
  /** log file **/
64045
c6160d0b0337 clarified modules;
wenzelm
parents:
diff changeset
    98
64155
646c4d6a6a02 tuned signature;
wenzelm
parents: 64150
diff changeset
    99
  // Print a date using the log file date format (Log_File.Date_Format).
  def print_date(date: Date): String =
    Log_File.Date_Format(date)
646c4d6a6a02 tuned signature;
wenzelm
parents: 64150
diff changeset
   100
64062
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   101
  object Log_File
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   102
  {
65607
c937984c70e9 tuned signature;
wenzelm
parents: 65605
diff changeset
   103
    /* log file */
c937984c70e9 tuned signature;
wenzelm
parents: 65605
diff changeset
   104
65609
9917b8e3b5c1 clarified plain_name / log_name;
wenzelm
parents: 65608
diff changeset
   105
    // Strip the first matching log/compression suffix from a file name;
    // names without any of these suffixes are returned unchanged.
    def plain_name(name: String): String =
    {
      val suffixes = List(".log", ".log.gz", ".log.xz", ".gz", ".xz")
      suffixes.find(suffix => name.endsWith(suffix))
        .map(suffix => Library.try_unsuffix(suffix, name).get)
        .getOrElse(name)
    }
9917b8e3b5c1 clarified plain_name / log_name;
wenzelm
parents: 65608
diff changeset
   112
64062
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   113
    // Log file from a name and its lines; the name is normalized by plain_name.
    def apply(name: String, lines: List[String]): Log_File =
    {
      val plain = plain_name(name)
      new Log_File(plain, lines)
    }
64062
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   115
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   116
    // Log file from a name and its full text, split into lines by
    // Library.trim_split_lines.
    def apply(name: String, text: String): Log_File =
    {
      val lines = Library.trim_split_lines(text)
      Log_File(name, lines)
    }
64090
5a68280112b3 more operations;
wenzelm
parents: 64089
diff changeset
   118
5a68280112b3 more operations;
wenzelm
parents: 64089
diff changeset
   119
    // Log file read from disk; the reader is chosen by file name suffix
    // (".gz", ".xz", otherwise plain read).
    def apply(file: JFile): Log_File =
    {
      val name = file.getName
      val text =
        name match {
          case _ if name.endsWith(".gz") => File.read_gzip(file)
          case _ if name.endsWith(".xz") => File.read_xz(file)
          case _ => File.read(file)
        }
      apply(name, text)
    }
5a68280112b3 more operations;
wenzelm
parents: 64089
diff changeset
   128
5a68280112b3 more operations;
wenzelm
parents: 64089
diff changeset
   129
    // Log file read from the file denoted by path.
    def apply(path: Path): Log_File =
      apply(path.file)
64101
976289c733e6 more formal directory content;
wenzelm
parents: 64100
diff changeset
   130
64110
c0b96b34c7b9 support for Isabelle/Jenkins log file format;
wenzelm
parents: 64109
diff changeset
   131
65607
c937984c70e9 tuned signature;
wenzelm
parents: 65605
diff changeset
   132
    /* log file collections */
c937984c70e9 tuned signature;
wenzelm
parents: 65605
diff changeset
   133
c937984c70e9 tuned signature;
wenzelm
parents: 65605
diff changeset
   134
    // Test whether a file name looks like a build log: it must start with one
    // of the prefixes, end with one of the suffixes, and must not be one of
    // the excluded special names.
    def is_log(file: JFile,
      prefixes: List[String] =
        List(Build_History.log_prefix, Identify.log_prefix, Isatest.log_prefix,
          AFP_Test.log_prefix, Jenkins.log_prefix),
      suffixes: List[String] = List(".log", ".log.gz", ".log.xz")): Boolean =
    {
      val name = file.getName
      val special_names = Set("isatest.log", "afp-test.log", "main.log")

      val has_prefix = prefixes.exists(prefix => name.startsWith(prefix))
      has_prefix &&
        suffixes.exists(suffix => name.endsWith(suffix)) &&
        !special_names.contains(name)
    }
c937984c70e9 tuned signature;
wenzelm
parents: 65605
diff changeset
   148
c937984c70e9 tuned signature;
wenzelm
parents: 65605
diff changeset
   149
    // Collect the files accepted by is_log (with its default prefixes and
    // suffixes) from File.find_files on each directory, in the order of dirs.
    def find_files(dirs: Iterable[Path]): List[JFile] =
    {
      val found =
        for {
          dir <- dirs.iterator
          file <- File.find_files(dir.file, is_log(_))
        } yield file
      found.toList
    }
c937984c70e9 tuned signature;
wenzelm
parents: 65605
diff changeset
   151
c937984c70e9 tuned signature;
wenzelm
parents: 65605
diff changeset
   152
64110
c0b96b34c7b9 support for Isabelle/Jenkins log file format;
wenzelm
parents: 64109
diff changeset
   153
    /* date format */
c0b96b34c7b9 support for Isabelle/Jenkins log file format;
wenzelm
parents: 64109
diff changeset
   154
64101
976289c733e6 more formal directory content;
wenzelm
parents: 64100
diff changeset
   155
    // Date format for log files: a list of accepted formatters, plus a
    // tuning function that rewrites certain weekday, month and timezone
    // words of the input.
    val Date_Format =
    {
      // formats with explicit zone/offset, in English and German variants
      val zoned_fmts =
        Date.Formatter.variants(
          List("EEE MMM d HH:mm:ss O yyyy", "EEE MMM d HH:mm:ss VV yyyy"),
          List(Locale.ENGLISH, Locale.GERMAN))

      // RFC 1123, and a zone-less format read as Europe/Berlin
      val other_fmts =
        List(
          DateTimeFormatter.RFC_1123_DATE_TIME,
          Date.Formatter.pattern("EEE MMM d HH:mm:ss yyyy").withZone(ZoneId.of("Europe/Berlin")))

      val fmts = zoned_fmts ::: other_fmts

      // timezone names that are replaced before parsing
      val timezones =
        Map(
          "CET" -> "GMT+1", "MET" -> "GMT+1",
          "CEST" -> "GMT+2", "MEST" -> "GMT+2",
          "EST" -> "Europe/Berlin")

      // three-letter German weekday abbreviations, shortened to two letters
      val weekdays =
        Map("Die" -> "Di", "Mit" -> "Mi", "Don" -> "Do", "Fre" -> "Fr", "Sam" -> "Sa", "Son" -> "So")

      def tune_timezone(s: String): String = timezones.getOrElse(s, s)
      def tune_weekday(s: String): String = weekdays.getOrElse(s, s)

      // Tune the first word as weekday and all later words as timezone; a
      // second word "M\uFFFDr" (U+FFFD replacement character, presumably a
      // mis-decoded umlaut) becomes "Mär".
      def tune(s: String): String =
      {
        val words =
          Word.explode(s) match {
            case Nil => Nil
            case day :: rest =>
              val rest1 =
                rest match {
                  case "M\uFFFDr" :: more => "Mär" :: more
                  case _ => rest
                }
              tune_weekday(day) :: rest1.map(tune_timezone(_))
          }
        Word.implode(words)
      }

      Date.Format.make(fmts, tune)
    }
64117
c2b41b073d8a build_history log files with formal meta info;
wenzelm
parents: 64116
diff changeset
   194
c2b41b073d8a build_history log files with formal meta info;
wenzelm
parents: 64116
diff changeset
   195
c2b41b073d8a build_history log files with formal meta info;
wenzelm
parents: 64116
diff changeset
   196
    /* inlined content */
c2b41b073d8a build_history log files with formal meta info;
wenzelm
parents: 64116
diff changeset
   197
64119
8094eaa38d4b inline session ML statistics into main build log;
wenzelm
parents: 64117
diff changeset
   198
    // Render properties as one inlined log entry: the marker followed by the
    // YXML string of the line-encoded properties.
    def print_props(marker: String, props: Properties.T): String =
    {
      val body = XML.Encode.properties(Properties.encode_lines(props))
      marker + YXML.string_of_body(body)
    }
64102
1ec2adddf16b prefer static Date_Format;
wenzelm
parents: 64101
diff changeset
   200
  }
1ec2adddf16b prefer static Date_Format;
wenzelm
parents: 64101
diff changeset
   201
1ec2adddf16b prefer static Date_Format;
wenzelm
parents: 64101
diff changeset
   202
  class Log_File private(val name: String, val lines: List[String])
1ec2adddf16b prefer static Date_Format;
wenzelm
parents: 64101
diff changeset
   203
  {
1ec2adddf16b prefer static Date_Format;
wenzelm
parents: 64101
diff changeset
   204
    log_file =>
1ec2adddf16b prefer static Date_Format;
wenzelm
parents: 64101
diff changeset
   205
1ec2adddf16b prefer static Date_Format;
wenzelm
parents: 64101
diff changeset
   206
    // A log file prints as its name.
    override def toString: String =
      name
1ec2adddf16b prefer static Date_Format;
wenzelm
parents: 64101
diff changeset
   207
1ec2adddf16b prefer static Date_Format;
wenzelm
parents: 64101
diff changeset
   208
    // The lines of the log file, joined by cat_lines.
    def text: String =
      cat_lines(lines)
1ec2adddf16b prefer static Date_Format;
wenzelm
parents: 64101
diff changeset
   209
1ec2adddf16b prefer static Date_Format;
wenzelm
parents: 64101
diff changeset
   210
    // Raise an error whose message is prefixed with the quoted log file name.
    def err(msg: String): Nothing =
    {
      val prefix = "Error in log file " + quote(name) + ": "
      error(prefix + msg)
    }
1ec2adddf16b prefer static Date_Format;
wenzelm
parents: 64101
diff changeset
   212
1ec2adddf16b prefer static Date_Format;
wenzelm
parents: 64101
diff changeset
   213
1ec2adddf16b prefer static Date_Format;
wenzelm
parents: 64101
diff changeset
   214
    /* date format */
64101
976289c733e6 more formal directory content;
wenzelm
parents: 64100
diff changeset
   215
976289c733e6 more formal directory content;
wenzelm
parents: 64100
diff changeset
   216
    // Extractor that always matches: it parses the string with
    // Log_File.Date_Format and turns a DateTimeParseException into an error
    // for this log file (via err) instead of a failed match.
    object Strict_Date
    {
      def unapply(s: String): Some[Date] =
      {
        val date =
          try { Log_File.Date_Format.parse(s) }
          catch { case exn: DateTimeParseException => log_file.err(exn.getMessage) }
        Some(date)
      }
    }
976289c733e6 more formal directory content;
wenzelm
parents: 64100
diff changeset
   222
976289c733e6 more formal directory content;
wenzelm
parents: 64100
diff changeset
   223
64062
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   224
    /* inlined content */
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   225
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   226
    // First defined result of f over the lines, in order; f is not applied
    // to lines after the first hit.
    def find[A](f: String => Option[A]): Option[A] =
    {
      val results = lines.iterator.map(f)
      results.find(_.isDefined).flatMap(result => result)
    }
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   228
64196
6688b9cd443b more robust wrt. old versions that use clear-text properties (e.g. Timing in build_history_base);
wenzelm
parents: 64193
diff changeset
   229
    // First result of Library.try_unprefix(marker, line) that is defined
    // (presumably the rest of the first line that starts with marker).
    def find_line(marker: String): Option[String] =
      find(line => Library.try_unprefix(marker, line))
6688b9cd443b more robust wrt. old versions that use clear-text properties (e.g. Timing in build_history_base);
wenzelm
parents: 64193
diff changeset
   231
65684
00d4663270d9 explicit support for multiple regexes;
wenzelm
parents: 65683
diff changeset
   232
    // Try the regexes in order. For each one, take the first line that
    // matches it with exactly one group and return that group. Later regexes
    // are only tried when the earlier ones yield nothing.
    def find_match(regexes: List[Regex]): Option[String] =
    {
      def first_match(regex: Regex): Option[String] =
        lines.iterator.map(line => regex.unapplySeq(line)).collectFirst({ case Some(List(s)) => s })

      regexes.iterator.map(first_match(_)).find(_.isDefined).flatMap(result => result)
    }
64062
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   239
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   240
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   241
    /* settings */
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   242
64091
f8dfba90e73f more liberal parsing for old AFP logs;
wenzelm
parents: 64090
diff changeset
   243
    // Entry of the first line of the form "a=...", decoded by
    // Settings.Entry.unapply; None if there is no such line.
    def get_setting(a: String): Option[Settings.Entry] =
    {
      val prefix = a + "="
      lines.find(line => line.startsWith(prefix))
        .flatMap(line => Settings.Entry.unapply(line))
    }
64045
c6160d0b0337 clarified modules;
wenzelm
parents:
diff changeset
   248
65611
a4a7841ae84f more uniform storage of Meta_Info;
wenzelm
parents: 65609
diff changeset
   249
    // Entries of all known settings (Settings.all_settings) that occur in
    // this log file, in the order of that list.
    def get_all_settings: Settings.T =
      Settings.all_settings.flatMap(c => get_setting(c.name))
64062
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   252
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   253
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   254
    /* properties (YXML) */
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   255
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   256
    // XML cache of this log file, used by parse_props.
    val xml_cache: XML.Cache = new XML.Cache()
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   257
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   258
    // Parse YXML text into properties: parse the body, decode it as
    // properties, decode lines, then pass the result through xml_cache.
    def parse_props(text: String): Properties.T =
    {
      val body = YXML.parse_body(text)
      val props = Properties.decode_lines(XML.Decode.properties(body))
      xml_cache.props(props)
    }
64062
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   260
64119
8094eaa38d4b inline session ML statistics into main build log;
wenzelm
parents: 64117
diff changeset
   261
    // Properties of all lines with the given marker whose remainder is
    // detected as YXML; other lines are skipped.
    def filter_props(marker: String): List[Properties.T] =
      lines.flatMap(line =>
        Library.try_unprefix(marker, line) match {
          case Some(s) if YXML.detect(s) => List(parse_props(s))
          case _ => Nil
        })
64062
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   267
64119
8094eaa38d4b inline session ML statistics into main build log;
wenzelm
parents: 64117
diff changeset
   268
    // Property list taken from the text that find_line yields for the marker.
    // The result is None when find_line yields nothing, or when that text is
    // not detected as YXML.
    def find_props(marker: String): Option[Properties.T] =
      find_line(marker)
        .filter(text => YXML.detect(text))
        .map(text => parse_props(text))
64062
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   273
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   274
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   275
    /* parse various formats */
a7352cbde7d7 misc tuning and clarification;
wenzelm
parents: 64061
diff changeset
   276
64105
d93bd6d253c6 tuned signature;
wenzelm
parents: 64104
diff changeset
   277
    // Meta info of this log file, as computed by Build_Log.parse_meta_info.
    def parse_meta_info(): Meta_Info =
    {
      val meta_info = Build_Log.parse_meta_info(log_file)
      meta_info
    }
d93bd6d253c6 tuned signature;
wenzelm
parents: 64104
diff changeset
   278
65646
014dbbe5331f parse ml_statistics only when required;
wenzelm
parents: 65645
diff changeset
   279
    // Build info of this log file, as computed by Build_Log.parse_build_info.
    // ML statistics are only parsed when explicitly requested.
    def parse_build_info(ml_statistics: Boolean = false): Build_Info =
    {
      val build_info = Build_Log.parse_build_info(log_file, parse_ml_statistics = ml_statistics)
      build_info
    }
64105
d93bd6d253c6 tuned signature;
wenzelm
parents: 64104
diff changeset
   281
64082
d57c7295f601 clarified signature;
wenzelm
parents: 64081
diff changeset
   282
    // Session info of this log file, as computed by
    // Build_Log.parse_session_info.  The three flags are passed through
    // unchanged; all of them are off by default.
    def parse_session_info(
        command_timings: Boolean = false,
        ml_statistics: Boolean = false,
        task_statistics: Boolean = false): Session_Info =
    {
      val session_info =
        Build_Log.parse_session_info(log_file, command_timings, ml_statistics, task_statistics)
      session_info
    }
64045
c6160d0b0337 clarified modules;
wenzelm
parents:
diff changeset
   287
  }
c6160d0b0337 clarified modules;
wenzelm
parents:
diff changeset
   288
c6160d0b0337 clarified modules;
wenzelm
parents:
diff changeset
   289
64098
099518e8af2c misc tuning and clarification;
wenzelm
parents: 64096
diff changeset
   290
65276
fa1a5efee2ec tuned comments;
wenzelm
parents: 65052
diff changeset
   291
  /** digested meta info: produced by Admin/build_history in log.xz file **/
64045
c6160d0b0337 clarified modules;
wenzelm
parents:
diff changeset
   292
64108
623abb8fecdf clarified meta info;
wenzelm
parents: 64107
diff changeset
   293
  // Companion: the empty meta info (no properties, no settings).
  object Meta_Info
  {
    val empty: Meta_Info = new Meta_Info(Nil, Nil)
  }

  // Meta info of a log file: a property list plus the settings found in it.
  sealed case class Meta_Info(props: Properties.T, settings: Settings.T)
  {
    // True when neither properties nor settings are present.
    def is_empty: Boolean =
      if (props.isEmpty) settings.isEmpty else false

    // Value stored under the name of column c: properties take precedence,
    // settings are only consulted as fallback.
    def get(c: SQL.Column): Option[String] =
      Properties.get(props, c.name) match {
        case None => Properties.get(settings, c.name)
        case found => found
      }

    // Like get, with the value parsed via Log_File.Date_Format.
    def get_date(c: SQL.Column): Option[Date] =
      for (s <- get(c)) yield Log_File.Date_Format.parse(s)
  }
64061
1bbea2b55d22 some support for header and data fields, notably from afp-test;
wenzelm
parents: 64054
diff changeset
   309
65625
13552d5c0005 more log files;
wenzelm
parents: 65624
diff changeset
   310
  // Format of "isabelle_identify" log files: file name prefix, engine name,
  // generated file content, and the patterns used to read it back.
  object Identify
  {
    val log_prefix = "isabelle_identify_"

    // Engine name: distinguishes files whose name carries the Jenkins prefix.
    def engine(log_file: Log_File): String =
    {
      val from_jenkins = log_file.name.startsWith(Jenkins.log_prefix)
      if (from_jenkins) "jenkins_identify" else "identify"
    }

    // Log file text: a start line with the printed date, an empty line, then
    // one line per version that is actually given.
    def content(date: Date, isabelle_version: Option[String], afp_version: Option[String]): String =
    {
      val header = List("isabelle_identify: " + Build_Log.print_date(date), "")
      val isabelle_lines = isabelle_version.toList.map(v => "Isabelle version: " + v)
      val afp_lines = afp_version.toList.map(v => "AFP version: " + v)
      terminate_lines(header ::: isabelle_lines ::: afp_lines)
    }

    val Start = """^isabelle_identify: (.+)$""".r
    // "$." cannot match: there is no end line in this format.
    val No_End = """$.""".r
    val Isabelle_Version = List("""^Isabelle version: (\S+)$""".r)
    val AFP_Version = List("""^AFP version: (\S+)$""".r)
  }
13552d5c0005 more log files;
wenzelm
parents: 65624
diff changeset
   329
64095
1a6d37c31df9 support for isatest format;
wenzelm
parents: 64094
diff changeset
   330
  // Format of isatest log files: file name prefix, engine name, and patterns
  // for the start line (date, host), the end line (date) and the version.
  object Isatest
  {
    val log_prefix = "isatest-makeall-"
    val engine = "isatest"
    val Start = """^------------------- starting test --- (.+) --- (.+)$""".r
    val End = """^------------------- test (?:successful|FAILED) --- (.+) --- .*$""".r
    val Isabelle_Version = List("""^Isabelle version: (\S+)$""".r)
  }
1a6d37c31df9 support for isatest format;
wenzelm
parents: 64094
diff changeset
   338
64109
wenzelm
parents: 64108
diff changeset
   339
  // Format of afp-test log files.  Start yields (date, host), Start_Old only
  // the date; the version patterns extract the id after "-- hg id".
  object AFP_Test
  {
    val log_prefix = "afp-test-devel-"
    val engine = "afp-test"
    val Start = """^Start test(?: for .+)? at ([^,]+), (.*)$""".r
    val Start_Old = """^Start test(?: for .+)? at ([^,]+)$""".r
    val End = """^End test on (.+), .+, elapsed time:.*$""".r
    val Isabelle_Version = List("""^Isabelle version: .* -- hg id (\S+)$""".r)
    val AFP_Version = List("""^AFP version: .* -- hg id (\S+)$""".r)
    // Line of a log whose initialization failed due to exceeded disk quota.
    val Bad_Init = """^cp:.*: Disc quota exceeded$""".r
  }
1bbea2b55d22 some support for header and data fields, notably from afp-test;
wenzelm
parents: 64054
diff changeset
   350
64110
c0b96b34c7b9 support for Isabelle/Jenkins log file format;
wenzelm
parents: 64109
diff changeset
   351
  // Format of Isabelle/Jenkins log files: file name prefix, engine name,
  // patterns for host, start and versions, and the two section markers.
  object Jenkins
  {
    val log_prefix = "jenkins_"
    val engine = "jenkins"
    val Host = """^Building remotely on (\S+) \((\S+)\).*$""".r
    // The last alternative is empty and is followed by ".*", so this pattern
    // accepts any line (without line terminators).
    val Start = """^(?:Started by an SCM change|Started from command line by admin|).*$""".r
    val Start_Date = """^Build started at (.+)$""".r
    // "$." cannot match: there is no end line in this format.
    val No_End = """$.""".r
    val Isabelle_Version =
      List(
        """^(?:Build for Isabelle id|Isabelle id) (\w+).*$""".r,
        """^ISABELLE_CI_REPO_ID="(\w+)".*$""".r,
        """^(\w{12}) tip.*$""".r)
    val AFP_Version =
      List(
        """^(?:Build for AFP id|AFP id) (\w+).*$""".r,
        """^ISABELLE_CI_AFP_ID="(\w+)".*$""".r)
    val CONFIGURATION = "=== CONFIGURATION ==="
    val BUILD = "=== BUILD ==="
  }
c0b96b34c7b9 support for Isabelle/Jenkins log file format;
wenzelm
parents: 64109
diff changeset
   369
64105
d93bd6d253c6 tuned signature;
wenzelm
parents: 64104
diff changeset
   370
  // Detect the format of a log file from its first line(s) and extract the
  // corresponding meta info.  Some known degenerate logs (see the cases at
  // the end) produce Meta_Info.empty.
  private def parse_meta_info(log_file: Log_File): Meta_Info =
  {
    // Assemble the meta info for one of the textual formats:
    //   engine, host: may be "" and are then omitted from the properties;
    //   start: start date of the build, also part of the build id;
    //   End: pattern for the last line, yielding the end date (if it matches);
    //   Isabelle_Version, AFP_Version: patterns passed to log_file.find_match.
    def parse(engine: String, host: String, start: Date,
      End: Regex, Isabelle_Version: List[Regex], AFP_Version: List[Regex]): Meta_Info =
    {
      // build id: "<host or engine or build>:<start time in ms>"
      val build_id =
      {
        val prefix = proper_string(host) orElse proper_string(engine) getOrElse "build"
        prefix + ":" + start.time.ms
      }
      val build_engine = if (engine == "") Nil else List(Prop.build_engine.name -> engine)
      val build_host = if (host == "") Nil else List(Prop.build_host.name -> host)

      val start_date = List(Prop.build_start.name -> print_date(start))
      // lastOption instead of last: no failure on an empty list of lines
      val end_date =
        log_file.lines.lastOption match {
          case Some(End(log_file.Strict_Date(end_date))) =>
            List(Prop.build_end.name -> print_date(end_date))
          case _ => Nil
        }

      val isabelle_version =
        log_file.find_match(Isabelle_Version).map(Prop.isabelle_version.name -> _)
      val afp_version =
        log_file.find_match(AFP_Version).map(Prop.afp_version.name -> _)

      Meta_Info((Prop.build_id.name -> build_id) :: build_engine ::: build_host :::
          start_date ::: end_date ::: isabelle_version.toList ::: afp_version.toList,
        log_file.get_all_settings)
    }

    log_file.lines match {
      // formal meta info: find_props yields None if the marked text is not
      // detected as YXML, which is reported as a proper log file error
      case line :: _ if line.startsWith(Build_History.META_INFO_MARKER) =>
        log_file.find_props(Build_History.META_INFO_MARKER) match {
          case Some(props) => Meta_Info(props, log_file.get_all_settings)
          case None => log_file.err("malformed meta info")
        }

      case Identify.Start(log_file.Strict_Date(start)) :: _ =>
        parse(Identify.engine(log_file), "", start, Identify.No_End,
          Identify.Isabelle_Version, Identify.AFP_Version)

      case Isatest.Start(log_file.Strict_Date(start), host) :: _ =>
        parse(Isatest.engine, host, start, Isatest.End,
          Isatest.Isabelle_Version, Nil)

      case AFP_Test.Start(log_file.Strict_Date(start), host) :: _ =>
        parse(AFP_Test.engine, host, start, AFP_Test.End,
          AFP_Test.Isabelle_Version, AFP_Test.AFP_Version)

      case AFP_Test.Start_Old(log_file.Strict_Date(start)) :: _ =>
        parse(AFP_Test.engine, "", start, AFP_Test.End,
          AFP_Test.Isabelle_Version, AFP_Test.AFP_Version)

      // NOTE(review): Jenkins.Start contains an empty alternative followed by
      // ".*", so this case appears to accept any first line; the cases below
      // would then only be reached for an empty list of lines -- confirm that
      // this order is intended.
      case Jenkins.Start() :: _ =>
        log_file.lines.dropWhile(_ != Jenkins.BUILD) match {
          // the start date is expected two lines after the BUILD marker
          case Jenkins.BUILD :: _ :: Jenkins.Start_Date(log_file.Strict_Date(start)) :: _ =>
            // host "a.b" from the first Host line before the CONFIGURATION marker
            val host =
              log_file.lines.takeWhile(_ != Jenkins.CONFIGURATION).collectFirst({
                case Jenkins.Host(a, b) => a + "." + b
              }).getOrElse("")
            parse(Jenkins.engine, host, start.to(ZoneId.of("Europe/Berlin")), Jenkins.No_End,
              Jenkins.Isabelle_Version, Jenkins.AFP_Version)
          case _ => Meta_Info.empty
        }

      case line :: _ if line.startsWith("\u0000") => Meta_Info.empty
      case List(Isatest.End(_)) => Meta_Info.empty
      case _ :: AFP_Test.Bad_Init() :: _ => Meta_Info.empty
      case Nil => Meta_Info.empty

      case _ => log_file.err("cannot detect log file format")
    }
  }
1bbea2b55d22 some support for header and data fields, notably from afp-test;
wenzelm
parents: 64054
diff changeset
   442
64085
1c451e5c145f clarified parse_build_info: isabelle build output;
wenzelm
parents: 64083
diff changeset
   443
64098
099518e8af2c misc tuning and clarification;
wenzelm
parents: 64096
diff changeset
   444
65276
fa1a5efee2ec tuned comments;
wenzelm
parents: 65052
diff changeset
   445
  /** build info: toplevel output of isabelle build or Admin/build_history **/
64119
8094eaa38d4b inline session ML statistics into main build log;
wenzelm
parents: 64117
diff changeset
   446
8094eaa38d4b inline session ML statistics into main build log;
wenzelm
parents: 64117
diff changeset
   447
  // Line prefix for ML statistics; note the leading form feed character.
  val ML_STATISTICS_MARKER: String = "\fML_statistics = "

  // Name "session_name" -- presumably a property key; usage is not shown here.
  val SESSION_NAME: String = "session_name"
64085
1c451e5c145f clarified parse_build_info: isabelle build output;
wenzelm
parents: 64083
diff changeset
   449
64061
1bbea2b55d22 some support for header and data fields, notably from afp-test;
wenzelm
parents: 64054
diff changeset
   450
  // Status values of a session entry, in declaration order.
  object Session_Status extends Enumeration
  {
    val existing = Value
    val finished = Value
    val failed = Value
    val cancelled = Value
  }
1bbea2b55d22 some support for header and data fields, notably from afp-test;
wenzelm
parents: 64054
diff changeset
   454
65643
a54371226182 clarified dummy Session_Entry;
wenzelm
parents: 65642
diff changeset
   455
  // Companion: the dummy entry, with every field at its default value.
  object Session_Entry
  {
    val empty: Session_Entry = new Session_Entry()
  }

  // Information about one session of a build.  All fields have neutral
  // defaults, so an entry can be built up incrementally.
  sealed case class Session_Entry(
    chapter: String = "",
    groups: List[String] = Nil,
    threads: Option[Int] = None,
    timing: Timing = Timing.zero,
    ml_timing: Timing = Timing.zero,
    heap_size: Option[Long] = None,
    status: Option[Session_Status.Value] = None,
    ml_statistics: List[Properties.T] = Nil)
  {
    // Chapter, unless it is the empty string.
    def proper_chapter: Option[String] =
      if (chapter != "") Some(chapter) else None

    // Groups joined via cat_lines, unless there are none.
    def proper_groups: Option[String] =
      if (groups.nonEmpty) Some(cat_lines(groups)) else None

    // True only for the explicit status "finished".
    def finished: Boolean = status.contains(Session_Status.finished)
  }
64054
1fc9ab31720d clarified modules;
wenzelm
parents: 64053
diff changeset
   474
64085
1c451e5c145f clarified parse_build_info: isabelle build output;
wenzelm
parents: 64083
diff changeset
   475
  // Build results as a map from session name to session entry.  The accessors
  // based on get_default yield a neutral value for unknown sessions, while
  // `session` is a plain map application.
  sealed case class Build_Info(sessions: Map[String, Session_Entry])
  {
    def session(name: String): Session_Entry = sessions.apply(name)
    def get_session(name: String): Option[Session_Entry] = sessions.get(name)

    // Apply f to the entry of the named session, or yield x if there is none.
    def get_default[A](name: String, f: Session_Entry => A, x: A): A =
      get_session(name).map(f).getOrElse(x)

    // Names of all sessions with status "finished".
    def finished_sessions: List[String] =
      (for (name <- sessions.keySet.iterator if finished(name)) yield name).toList

    def finished(name: String): Boolean =
      get_default[Boolean](name, entry => entry.finished, false)

    def timing(name: String): Timing =
      get_default[Timing](name, entry => entry.timing, Timing.zero)

    def ml_timing(name: String): Timing =
      get_default[Timing](name, entry => entry.ml_timing, Timing.zero)

    // ML statistics of the named session; empty statistics if it is unknown.
    def ml_statistics(name: String): ML_Statistics =
      get_session(name) match {
        case Some(entry) => ML_Statistics(name, entry.ml_statistics)
        case None => ML_Statistics.empty
      }
  }
1fc9ab31720d clarified modules;
wenzelm
parents: 64053
diff changeset
   493
65646
014dbbe5331f parse ml_statistics only when required;
wenzelm
parents: 65645
diff changeset
   494
  /* Parse "isabelle build" output from a log file into per-session entries.

     Each line is matched against the patterns below; lines that match none of
     them are ignored.  ML statistics are collected only if parse_ml_statistics
     is set; a statistics line whose properties do not start with the session
     name is reported via log_file.err.

     Session status is determined in this order: explicit FAILED line, explicit
     CANCELLED line, presence of any timing information (finished), started
     without any result (treated as failed), otherwise merely existing. */
  private def parse_build_info(log_file: Log_File, parse_ml_statistics: Boolean): Build_Info =
  {
    // total extractor: "chapter/name" is split, anything else gets an empty chapter
    object Chapter_Name
    {
      def unapply(s: String): Some[(String, String)] =
        space_explode('/', s) match {
          case List(chapter, name) => Some((chapter, name))
          case _ => Some(("", s))
        }
    }

    val Session_No_Groups = new Regex("""^Session (\S+)$""")
    val Session_Groups = new Regex("""^Session (\S+) \((.*)\)$""")
    val Session_Finished1 =
      new Regex("""^Finished (\S+) \((\d+):(\d+):(\d+) elapsed time, (\d+):(\d+):(\d+) cpu time.*$""")
    val Session_Finished2 =
      new Regex("""^Finished (\S+) \((\d+):(\d+):(\d+) elapsed time.*$""")
    val Session_Timing =
      new Regex("""^Timing (\S+) \((\d+) threads, (\d+\.\d+)s elapsed time, (\d+\.\d+)s cpu time, (\d+\.\d+)s GC time.*$""")
    val Session_Started = new Regex("""^(?:Running|Building) (\S+) \.\.\.$""")
    val Session_Failed = new Regex("""^(\S+) FAILED""")
    val Session_Cancelled = new Regex("""^(\S+) CANCELLED""")
    val Heap = new Regex("""^Heap (\S+) \((\d+) bytes\)$""")

    // accumulated information, keyed by session name
    var chapter = Map.empty[String, String]
    var groups = Map.empty[String, List[String]]
    var threads = Map.empty[String, Int]
    var timing = Map.empty[String, Timing]
    var ml_timing = Map.empty[String, Timing]
    var started = Set.empty[String]
    var failed = Set.empty[String]
    var cancelled = Set.empty[String]
    var heap_sizes = Map.empty[String, Long]
    var ml_statistics = Map.empty[String, List[Properties.T]]

    // every session mentioned by at least one recognized line
    def all_sessions: Set[String] =
      chapter.keySet ++ groups.keySet ++ threads.keySet ++ timing.keySet ++ ml_timing.keySet ++
      failed ++ cancelled ++ started ++ heap_sizes.keySet ++ ml_statistics.keySet


    for (line <- log_file.lines) {
      line match {
        case Session_No_Groups(Chapter_Name(chapt, name)) =>
          chapter += (name -> chapt)
          groups += (name -> Nil)

        case Session_Groups(Chapter_Name(chapt, name), grps) =>
          chapter += (name -> chapt)
          groups += (name -> Word.explode(grps))

        case Session_Started(name) =>
          started += name

        // more specific pattern (with cpu time) must come before Session_Finished2
        case Session_Finished1(name,
            Value.Int(e1), Value.Int(e2), Value.Int(e3),
            Value.Int(c1), Value.Int(c2), Value.Int(c3)) =>
          val elapsed = Time.hms(e1, e2, e3)
          val cpu = Time.hms(c1, c2, c3)
          timing += (name -> Timing(elapsed, cpu, Time.zero))

        case Session_Finished2(name,
            Value.Int(e1), Value.Int(e2), Value.Int(e3)) =>
          val elapsed = Time.hms(e1, e2, e3)
          timing += (name -> Timing(elapsed, Time.zero, Time.zero))

        case Session_Timing(name,
            Value.Int(t), Value.Double(e), Value.Double(c), Value.Double(g)) =>
          val elapsed = Time.seconds(e)
          val cpu = Time.seconds(c)
          val gc = Time.seconds(g)
          ml_timing += (name -> Timing(elapsed, cpu, gc))
          threads += (name -> t)

        case Heap(name, Value.Long(size)) =>
          heap_sizes += (name -> size)

        // explicit status lines: previously these patterns were defined but never
        // applied, so the failed/cancelled sets stayed empty; placed after the
        // other patterns to keep the outcome for all lines matched so far
        case Session_Failed(name) =>
          failed += name

        case Session_Cancelled(name) =>
          cancelled += name

        case _
        if parse_ml_statistics && line.startsWith(ML_STATISTICS_MARKER) && YXML.detect(line) =>
          val (name, props) =
            Library.try_unprefix(ML_STATISTICS_MARKER, line).map(log_file.parse_props(_)) match {
              case Some((SESSION_NAME, session_name) :: props) => (session_name, props)
              case _ => log_file.err("malformed ML_statistics " + quote(line))
            }
          // prepend here, reverse once when building the final entry
          ml_statistics += (name -> (props :: ml_statistics.getOrElse(name, Nil)))

        case _ =>
      }
    }

    val sessions =
      Map(
        (for (name <- all_sessions.toList) yield {
          val status =
            if (failed(name)) Session_Status.failed
            else if (cancelled(name)) Session_Status.cancelled
            else if (timing.isDefinedAt(name) || ml_timing.isDefinedAt(name))
              Session_Status.finished
            // started, but no result at all: count as failed
            else if (started(name)) Session_Status.failed
            else Session_Status.existing
          val entry =
            Session_Entry(
              chapter = chapter.getOrElse(name, ""),
              groups = groups.getOrElse(name, Nil),
              threads = threads.get(name),
              timing = timing.getOrElse(name, Timing.zero),
              ml_timing = ml_timing.getOrElse(name, Timing.zero),
              heap_size = heap_sizes.get(name),
              status = Some(status),
              ml_statistics = ml_statistics.getOrElse(name, Nil).reverse)
          (name -> entry)
        }):_*)
    Build_Info(sessions)
  }
64099
wenzelm
parents: 64098
diff changeset
   607
wenzelm
parents: 64098
diff changeset
   608
wenzelm
parents: 64098
diff changeset
   609
65276
fa1a5efee2ec tuned comments;
wenzelm
parents: 65052
diff changeset
   610
  /** session info: produced by isabelle build as session log.gz file **/
64099
wenzelm
parents: 64098
diff changeset
   611
wenzelm
parents: 64098
diff changeset
   612
  /* Properties extracted from a single session log file; see parse_session_info
     for the markers each field is read from. */
  sealed case class Session_Info(
    // properties of the "Timing" line, or Nil if the log has none
    session_timing: Properties.T,
    // one property list per "command_timing" line
    command_timings: List[Properties.T],
    // one property list per ML statistics line
    ml_statistics: List[Properties.T],
    // one property list per "task_statistics" line
    task_statistics: List[Properties.T]
  )
wenzelm
parents: 64098
diff changeset
   617
wenzelm
parents: 64098
diff changeset
   618
  /* Read session information from a session log file.

     The session timing is always looked up (Nil if absent); each of the three
     bulk lists is only read when its flag is set, and is Nil otherwise. */
  private def parse_session_info(
    log_file: Log_File,
    command_timings: Boolean,
    ml_statistics: Boolean,
    task_statistics: Boolean): Session_Info =
  {
    // all property lines with the given marker, but only on request
    def optional_props(enabled: Boolean, marker: String): List[Properties.T] =
      if (enabled) log_file.filter_props(marker) else Nil

    val session_timing = log_file.find_props("\fTiming = ").getOrElse(Nil)

    Session_Info(
      session_timing = session_timing,
      command_timings = optional_props(command_timings, "\fcommand_timing = "),
      ml_statistics = optional_props(ml_statistics, ML_STATISTICS_MARKER),
      task_statistics = optional_props(task_statistics, "\ftask_statistics = "))
  }
65595
ffd8283b7be0 support for database connection;
wenzelm
parents: 65591
diff changeset
   630
ffd8283b7be0 support for database connection;
wenzelm
parents: 65591
diff changeset
   631
ffd8283b7be0 support for database connection;
wenzelm
parents: 65591
diff changeset
   632
ffd8283b7be0 support for database connection;
wenzelm
parents: 65591
diff changeset
   633
  /** persistent store **/
ffd8283b7be0 support for database connection;
wenzelm
parents: 65591
diff changeset
   634
65694
b82f2990161a clarified modules;
wenzelm
parents: 65693
diff changeset
   635
  /* SQL data model */
b82f2990161a clarified modules;
wenzelm
parents: 65693
diff changeset
   636
b82f2990161a clarified modules;
wenzelm
parents: 65693
diff changeset
   637
  object Data
  {
    /* table with the common "isabelle_build_log_" name prefix; a non-empty body
       is passed on to SQL.Table unchanged */
    def build_log_table(name: String, columns: List[SQL.Column], body: String = ""): SQL.Table =
    {
      val full_name = "isabelle_build_log_" + name
      SQL.Table(full_name, columns, body)
    }


    /* main content */

    // key columns
    val log_name = SQL.Column.string("log_name", primary_key = true)
    val session_name = SQL.Column.string("session_name", primary_key = true)

    // general session information
    val chapter = SQL.Column.string("chapter")
    val groups = SQL.Column.string("groups")
    val threads = SQL.Column.int("threads")

    // session timing
    val timing_elapsed = SQL.Column.long("timing_elapsed")
    val timing_cpu = SQL.Column.long("timing_cpu")
    val timing_gc = SQL.Column.long("timing_gc")
    val timing_factor = SQL.Column.double("timing_factor")

    // ML timing
    val ml_timing_elapsed = SQL.Column.long("ml_timing_elapsed")
    val ml_timing_cpu = SQL.Column.long("ml_timing_cpu")
    val ml_timing_gc = SQL.Column.long("ml_timing_gc")
    val ml_timing_factor = SQL.Column.double("ml_timing_factor")

    // remaining session data
    val heap_size = SQL.Column.long("heap_size")
    val status = SQL.Column.string("status")
    val ml_statistics = SQL.Column.bytes("ml_statistics")

    val meta_info_table =
      build_log_table("meta_info", log_name :: Prop.all_props ::: Settings.all_settings)

    val sessions_table =
    {
      val key_columns = List(log_name, session_name)
      val info_columns = List(chapter, groups, threads)
      val timing_columns = List(timing_elapsed, timing_cpu, timing_gc, timing_factor)
      val ml_timing_columns =
        List(ml_timing_elapsed, ml_timing_cpu, ml_timing_gc, ml_timing_factor)
      build_log_table("sessions",
        key_columns ::: info_columns ::: timing_columns ::: ml_timing_columns :::
          List(heap_size, status))
    }

    val ml_statistics_table =
      build_log_table("ml_statistics", List(log_name, session_name, ml_statistics))


    /* earliest pull date for repository version (PostgreSQL queries) */

    val pull_date = SQL.Column.date("pull_date")

    // minimal build start per Isabelle version, taken from the meta info table
    val pull_date_table: SQL.Table =
    {
      val version = Prop.isabelle_version
      val start = Prop.build_start
      val query =
        "SELECT " + version + ", min(" + start + ") AS " + pull_date +
        " FROM " + meta_info_table +
        " WHERE " + version + " IS NOT NULL AND " + start + " IS NOT NULL" +
        " GROUP BY " + version
      build_log_table("pull_date", List(version.copy(primary_key = true), pull_date), query)
    }

    // SQL expression for the point in time the given number of days ago;
    // negative values count as 0
    def recent_time(days: Int): SQL.Source =
    {
      val n = days.max(0)
      "now() - INTERVAL '" + n + " days'"
    }

    // the pull date entries that are newer than recent_time(days)
    def recent_table(days: Int): SQL.Table =
    {
      val source = pull_date_table
      val condition = "WHERE " + pull_date(source) + " > " + recent_time(days)
      SQL.Table("recent", source.columns, source.select(source.columns, condition))
    }

    // select from table, restricted to recent Isabelle versions via inner join;
    // the pull_date flag appends the pull date of the recent table to the columns
    def select_recent(table: SQL.Table, columns: List[SQL.Column], days: Int,
      distinct: Boolean = false, pull_date: Boolean = false): SQL.Source =
    {
      val recent = recent_table(days)
      // parameter pull_date shadows the column: refer to it via Data
      val extra_columns = if (pull_date) List(Data.pull_date(recent)) else Nil
      val selection = table.select(columns ::: extra_columns, distinct = distinct)
      val join_condition =
        " ON " + Prop.isabelle_version(table) + " = " + Prop.isabelle_version(recent)
      selection + " INNER JOIN " + recent.query_name + join_condition
    }


    /* universal view on main data */

    val universal_table: SQL.Table =
    {
      val meta_info = meta_info_table
      val pull_dates = pull_date_table
      val sessions = sessions_table

      // meta info extended by pull date: columns after the first two are
      // qualified by the meta info table
      val aux_columns = log_name :: pull_date :: meta_info.columns.tail
      val (plain_columns, meta_columns) = aux_columns.splitAt(2)
      val aux_query =
        SQL.select(plain_columns ::: meta_columns.map(column => column(meta_info))) +
          meta_info + " LEFT OUTER JOIN " + pull_dates +
          " ON " + Prop.isabelle_version(meta_info) + " = " + Prop.isabelle_version(pull_dates)
      val aux_table = SQL.Table("aux", aux_columns, aux_query)

      // session columns follow, without repeating their leading log_name
      val columns = aux_columns ::: sessions.columns.tail
      val aux_log_name = log_name(aux_table)
      val query =
        SQL.select(aux_log_name :: columns.tail) + aux_table.query_name +
        " INNER JOIN " + sessions + " ON " + aux_log_name + " = " + log_name(sessions)
      SQL.Table("isabelle_build_log", columns, query)
    }
  }
b82f2990161a clarified modules;
wenzelm
parents: 65693
diff changeset
   731
b82f2990161a clarified modules;
wenzelm
parents: 65693
diff changeset
   732
b82f2990161a clarified modules;
wenzelm
parents: 65693
diff changeset
   733
  /* database access */
b82f2990161a clarified modules;
wenzelm
parents: 65693
diff changeset
   734
65595
ffd8283b7be0 support for database connection;
wenzelm
parents: 65591
diff changeset
   735
  // public entry point for Store, whose constructor is private to Build_Log
  def store(options: Options): Store = new Store(options)
ffd8283b7be0 support for database connection;
wenzelm
parents: 65591
diff changeset
   736
ffd8283b7be0 support for database connection;
wenzelm
parents: 65591
diff changeset
   737
  class Store private[Build_Log](options: Options) extends Properties.Store
ffd8283b7be0 support for database connection;
wenzelm
parents: 65591
diff changeset
   738
  {
ffd8283b7be0 support for database connection;
wenzelm
parents: 65591
diff changeset
   739
    /* Open the PostgreSQL build log database, optionally via an SSH session.

       Every parameter defaults to the corresponding "build_log_*" option.  An
       empty ssh_host means no SSH session; otherwise a session is opened to
       ssh_host as ssh_user on ssh_port and handed to PostgreSQL.open_database.
       ssh_close = true is passed along, presumably so that the SSH session is
       closed together with the database -- confirm in PostgreSQL.open_database. */
    def open_database(
      user: String = options.string("build_log_database_user"),
      password: String = options.string("build_log_database_password"),
      database: String = options.string("build_log_database_name"),
      host: String = options.string("build_log_database_host"),
      port: Int = options.int("build_log_database_port"),
      ssh_host: String = options.string("build_log_ssh_host"),
      ssh_user: String = options.string("build_log_ssh_user"),
      ssh_port: Int = options.int("build_log_ssh_port")): PostgreSQL.Database =
    {
      PostgreSQL.open_database(
        user = user, password = password, database = database, host = host, port = port,
        ssh =
          if (ssh_host == "") None
          // the SSH session uses ssh_port: port belongs to the database server
          // (it was passed here by mistake, leaving ssh_port unused)
          else Some(SSH.init_context(options).open_session(ssh_host, ssh_user, ssh_port)),
        ssh_close = true)
    }
65599
08dfa79866ec database storage of Meta_Info and Build_Info;
wenzelm
parents: 65595
diff changeset
   756
65723
3ee466e89047 clarified signature: PostgreSQL manages high-volume data, SQLite only sees small snapshots;
wenzelm
parents: 65722
diff changeset
   757
    // Incorporate the log files found in the given directories into the database
    // (via write_info), then create the pull_date and universal views.
    def update_database(
      db: PostgreSQL.Database,
      dirs: List[Path],
      ml_statistics: Boolean = false): Unit =
    {
      val log_files = Log_File.find_files(dirs)
      write_info(db, log_files, ml_statistics = ml_statistics)

      // order matters: pull_date view first, universal view second
      for (view <- List(Data.pull_date_table, Data.universal_table))
        db.create_view(view)
    }
b82f2990161a clarified modules;
wenzelm
parents: 65693
diff changeset
   764
65723
3ee466e89047 clarified signature: PostgreSQL manages high-volume data, SQLite only sees small snapshots;
wenzelm
parents: 65722
diff changeset
   765
    // Write a fresh SQLite snapshot of recent content of the PostgreSQL database.
    //
    //   db               source database (read within a transaction)
    //   sqlite_database  target file: its directory is created, an existing file is deleted
    //   days             passed to Data.select_recent / Data.recent_table to restrict the
    //                    selection (presumably an age limit in days -- see their definitions)
    //   ml_statistics    also copy the ml_statistics of each selected log
    //
    // The ml_statistics table is always created in the snapshot, but only filled on request.
    def snapshot_database(db: PostgreSQL.Database, sqlite_database: Path,
      days: Int = 100, ml_statistics: Boolean = false)
    {
      Isabelle_System.mkdirs(sqlite_database.dir)
      sqlite_database.file.delete

      using(SQLite.open_database(sqlite_database))(db2 =>
      {
        db.transaction {
          db2.transaction {
            // main content
            db2.create_table(Data.meta_info_table)
            db2.create_table(Data.sessions_table)
            db2.create_table(Data.ml_statistics_table)

            val recent_log_names =
              db.using_statement(
                Data.select_recent(
                  Data.meta_info_table, List(Data.log_name), days, distinct = true))(stmt =>
                    stmt.execute_query().iterator(_.string(Data.log_name)).toList)

            for (log_name <- recent_log_names) {
              read_meta_info(db, log_name).foreach(meta_info =>
                update_meta_info(db2, log_name, meta_info))

              update_sessions(db2, log_name, read_build_info(db, log_name))

              // read_build_info only retrieves ml_statistics on explicit request:
              // without the flag every session has empty statistics and nothing is copied
              if (ml_statistics) {
                update_ml_statistics(db2, log_name,
                  read_build_info(db, log_name, ml_statistics = true))
              }
            }

            // pull_date
            {
              val table = Data.pull_date_table
              db2.create_table(table)
              db2.using_statement(table.insert())(stmt2 =>
              {
                db.using_statement(Data.recent_table(days).query)(stmt =>
                {
                  // copy each source row column-by-column, all values transferred as strings
                  val res = stmt.execute_query()
                  while (res.next()) {
                    for ((c, i) <- table.columns.zipWithIndex)
                      stmt2.set_string(i + 1, res.get_string(c))
                    stmt2.execute()
                  }
                })
              })
            }

            // full view
            db2.create_view(Data.universal_table)
          }
        }
        // after both transactions are finished (presumably compacts the SQLite file)
        db2.rebuild
      })
    }
b82f2990161a clarified modules;
wenzelm
parents: 65693
diff changeset
   821
65688
wenzelm
parents: 65685
diff changeset
   822
    // The set of distinct string values of the given column within the given table.
    def domain(db: SQL.Database, table: SQL.Table, column: SQL.Column): Set[String] =
    {
      val select_distinct = table.select(List(column), distinct = true)
      db.using_statement(select_distinct)(stmt =>
      {
        val result = stmt.execute_query()
        result.iterator(res => res.string(column)).toSet
      })
    }
65688
wenzelm
parents: 65685
diff changeset
   825
65705
d0ca2a3ea657 more snapshot content;
wenzelm
parents: 65703
diff changeset
   826
    // Insert the meta info of one log file as a single row of the meta_info table,
    // using the "permissive" insert statement provided by the database.
    def update_meta_info(db: SQL.Database, log_name: String, meta_info: Meta_Info): Unit =
    {
      val meta_table = Data.meta_info_table
      db.using_statement(db.insert_permissive(meta_table))(stmt =>
      {
        // parameter 1 is the log name (first column of the table)
        stmt.set_string(1, log_name)

        // the remaining columns occupy parameters 2, 3, ...
        meta_table.columns.tail.zipWithIndex.foreach({ case (column, offset) =>
          val position = offset + 2
          if (column.T == SQL.Type.Date) stmt.set_date(position, meta_info.get_date(column))
          else stmt.set_string(position, meta_info.get(column))
        })

        stmt.execute()
      })
    }
138ffa41dc54 clarified filter_files: sorted and unique;
wenzelm
parents: 65599
diff changeset
   841
65705
d0ca2a3ea657 more snapshot content;
wenzelm
parents: 65703
diff changeset
   842
    // Insert one row per session of the given build into the sessions table.
    // A build without any sessions is recorded as one row with empty session name
    // and Session_Entry.empty as content.
    def update_sessions(db: SQL.Database, log_name: String, build_info: Build_Info): Unit =
    {
      val sessions_table = Data.sessions_table
      db.using_statement(db.insert_permissive(sessions_table))(stmt =>
      {
        val rows =
          if (build_info.sessions.nonEmpty) build_info.sessions.iterator
          else Iterator("" -> Session_Entry.empty)

        rows.foreach({ case (name, entry) =>
          val timing = entry.timing
          val ml_timing = entry.ml_timing

          // key
          stmt.set_string(1, log_name)
          stmt.set_string(2, name)

          // session properties
          stmt.set_string(3, entry.proper_chapter)
          stmt.set_string(4, entry.proper_groups)
          stmt.set_int(5, entry.threads)

          // overall timing
          stmt.set_long(6, timing.elapsed.proper_ms)
          stmt.set_long(7, timing.cpu.proper_ms)
          stmt.set_long(8, timing.gc.proper_ms)
          stmt.set_double(9, timing.factor)

          // ML timing
          stmt.set_long(10, ml_timing.elapsed.proper_ms)
          stmt.set_long(11, ml_timing.cpu.proper_ms)
          stmt.set_long(12, ml_timing.gc.proper_ms)
          stmt.set_double(13, ml_timing.factor)

          // result
          stmt.set_long(14, entry.heap_size)
          stmt.set_string(15, entry.status.map(_.toString))

          stmt.execute()
        })
      })
    }
1423cbbc542d clarified database update operations;
wenzelm
parents: 65639
diff changeset
   870
65705
d0ca2a3ea657 more snapshot content;
wenzelm
parents: 65703
diff changeset
   871
    // Insert the compressed ml_statistics of each session of the given build into the
    // ml_statistics table. Sessions without statistics are omitted; if nothing remains,
    // a single row with empty session name and no data is written instead.
    def update_ml_statistics(db: SQL.Database, log_name: String, build_info: Build_Info): Unit =
    {
      val stats_table = Data.ml_statistics_table
      db.using_statement(db.insert_permissive(stats_table))(stmt =>
      {
        val sessions_with_stats: List[(String, Session_Entry)] =
          build_info.sessions.iterator.filter({ case (_, entry) =>
            entry.ml_statistics.nonEmpty }).toList

        // compression of the individual sessions goes through Par_List.map
        val compressed: List[(String, Option[Bytes])] =
          Par_List.map[(String, Session_Entry), (String, Option[Bytes])](
            { case (name, entry) => (name, compress_properties(entry.ml_statistics).proper) },
            sessions_with_stats)

        val rows: List[(String, Option[Bytes])] =
          if (compressed.isEmpty) List("" -> None) else compressed

        rows.foreach({ case (name, data) =>
          stmt.set_string(1, log_name)
          stmt.set_string(2, name)
          stmt.set_bytes(3, data)
          stmt.execute()
        })
      })
    }
2c704ae04db1 clarified database layout: bulky ml_statistics are stored/retrieved separately;
wenzelm
parents: 65643
diff changeset
   889
2c704ae04db1 clarified database layout: bulky ml_statistics are stored/retrieved separately;
wenzelm
parents: 65643
diff changeset
   890
    // Write the content of the given log files into the meta_info, sessions and
    // (optionally) ml_statistics tables of the database.
    //
    //   db             target database; all three tables are created on demand
    //   files          candidate log files; only those missing from some table are read
    //   ml_statistics  also parse and store ML statistics
    //
    // Files are processed in groups of 100: each group is read via Par_List.map and
    // written within one database transaction.
    def write_info(db: SQL.Database, files: List[JFile], ml_statistics: Boolean = false)
    {
      // Update status of one table: the log names already present, and how to add more.
      abstract class Table_Status(table: SQL.Table)
      {
        db.create_table(table)
        // log names present in the table, extended as updates are performed
        private var known: Set[String] = domain(db, table, Data.log_name)

        // check by file name only, before the file is actually read
        def required(file: JFile): Boolean = !known(Log_File.plain_name(file.getName))

        def update_db(db: SQL.Database, log_file: Log_File): Unit
        def update(log_file: Log_File)
        {
          if (!known(log_file.name)) {
            update_db(db, log_file)
            known += log_file.name
          }
        }
      }
      val status =
        List(
          new Table_Status(Data.meta_info_table) {
            override def update_db(db: SQL.Database, log_file: Log_File): Unit =
              update_meta_info(db, log_file.name, log_file.parse_meta_info())
          },
          new Table_Status(Data.sessions_table) {
            override def update_db(db: SQL.Database, log_file: Log_File): Unit =
              update_sessions(db, log_file.name, log_file.parse_build_info())
          },
          new Table_Status(Data.ml_statistics_table) {
            // without ml_statistics this table is never written, so it must not demand
            // files either: otherwise every log file would be re-read on each run
            override def required(file: JFile): Boolean =
              ml_statistics && super.required(file)

            override def update_db(db: SQL.Database, log_file: Log_File): Unit =
            if (ml_statistics) {
              update_ml_statistics(db, log_file.name,
                log_file.parse_build_info(ml_statistics = true))
            }
          })

      for (file_group <- files.filter(file => status.exists(_.required(file))).grouped(100)) {
        val log_files = Par_List.map[JFile, Log_File](Log_File.apply _, file_group)
        db.transaction { log_files.foreach(log_file => status.foreach(_.update(log_file))) }
      }
    }
a6447eb6bc38 separate small meta_info vs. big build_info;
wenzelm
parents: 65603
diff changeset
   931
65621
551950dccec6 operations to read database;
wenzelm
parents: 65619
diff changeset
   932
    // Read the meta info stored for the given log name, or None if the meta_info table
    // has no row for it. Only columns with a defined value contribute an entry.
    def read_meta_info(db: SQL.Database, log_name: String): Option[Meta_Info] =
    {
      val meta_table = Data.meta_info_table
      val columns = meta_table.columns.tail
      val select_row = meta_table.select(columns, Data.log_name.where_equal(log_name))

      db.using_statement(select_row)(stmt =>
      {
        val res = stmt.execute_query()
        if (res.next) {
          // column name with optional value, dates rendered via Log_File.Date_Format
          val values =
            for (c <- columns) yield {
              val value =
                if (c.T == SQL.Type.Date) res.get_date(c).map(Log_File.Date_Format(_))
                else res.get_string(c)
              c.name -> value
            }

          // the first Prop.all_props.length columns are props, the rest are settings
          val (prop_values, setting_values) = values.splitAt(Prop.all_props.length)
          val props = prop_values.collect({ case (a, Some(b)) => (a, b) })
          val settings = setting_values.collect({ case (a, Some(b)) => (a, b) })

          Some(Meta_Info(props, settings))
        }
        else None
      })
    }
551950dccec6 operations to read database;
wenzelm
parents: 65619
diff changeset
   954
551950dccec6 operations to read database;
wenzelm
parents: 65619
diff changeset
   955
    def read_build_info(
65629
e6c0afe672fa optional ml_statistics: much faster;
wenzelm
parents: 65628
diff changeset
   956
      db: SQL.Database,
e6c0afe672fa optional ml_statistics: much faster;
wenzelm
parents: 65628
diff changeset
   957
      log_name: String,
e6c0afe672fa optional ml_statistics: much faster;
wenzelm
parents: 65628
diff changeset
   958
      session_names: List[String] = Nil,
e6c0afe672fa optional ml_statistics: much faster;
wenzelm
parents: 65628
diff changeset
   959
      ml_statistics: Boolean = false): Build_Info =
65621
551950dccec6 operations to read database;
wenzelm
parents: 65619
diff changeset
   960
    {
65694
b82f2990161a clarified modules;
wenzelm
parents: 65693
diff changeset
   961
      val table1 = Data.sessions_table
b82f2990161a clarified modules;
wenzelm
parents: 65693
diff changeset
   962
      val table2 = Data.ml_statistics_table
65629
e6c0afe672fa optional ml_statistics: much faster;
wenzelm
parents: 65628
diff changeset
   963
65645
2c704ae04db1 clarified database layout: bulky ml_statistics are stored/retrieved separately;
wenzelm
parents: 65643
diff changeset
   964
      val where_log_name =
65699
9f74d9aa0bdf tuned signature;
wenzelm
parents: 65698
diff changeset
   965
        Data.log_name(table1).where_equal(log_name) + " AND " +
65701
d788c11176e5 simplified: standard toString is SQL.ident;
wenzelm
parents: 65700
diff changeset
   966
        Data.session_name(table1) + " <> ''"
65621
551950dccec6 operations to read database;
wenzelm
parents: 65619
diff changeset
   967
      val where =
65645
2c704ae04db1 clarified database layout: bulky ml_statistics are stored/retrieved separately;
wenzelm
parents: 65643
diff changeset
   968
        if (session_names.isEmpty) where_log_name
65621
551950dccec6 operations to read database;
wenzelm
parents: 65619
diff changeset
   969
        else
65645
2c704ae04db1 clarified database layout: bulky ml_statistics are stored/retrieved separately;
wenzelm
parents: 65643
diff changeset
   970
          where_log_name + " AND " +
65701
d788c11176e5 simplified: standard toString is SQL.ident;
wenzelm
parents: 65700
diff changeset
   971
          session_names.map(a => Data.session_name(table1) + " = " + SQL.string(a)).
65621
551950dccec6 operations to read database;
wenzelm
parents: 65619
diff changeset
   972
            mkString("(", " OR ", ")")
65629
e6c0afe672fa optional ml_statistics: much faster;
wenzelm
parents: 65628
diff changeset
   973
65645
2c704ae04db1 clarified database layout: bulky ml_statistics are stored/retrieved separately;
wenzelm
parents: 65643
diff changeset
   974
      val columns1 = table1.columns.tail.map(_.apply(table1))
2c704ae04db1 clarified database layout: bulky ml_statistics are stored/retrieved separately;
wenzelm
parents: 65643
diff changeset
   975
      val (columns, from) =
2c704ae04db1 clarified database layout: bulky ml_statistics are stored/retrieved separately;
wenzelm
parents: 65643
diff changeset
   976
        if (ml_statistics) {
65694
b82f2990161a clarified modules;
wenzelm
parents: 65693
diff changeset
   977
          val columns = columns1 ::: List(Data.ml_statistics(table2))
65668
366bc4e6a238 more operations;
wenzelm
parents: 65665
diff changeset
   978
          val join =
65738
wenzelm
parents: 65736
diff changeset
   979
            table1 + " LEFT OUTER JOIN " + table2 + " ON " +
wenzelm
parents: 65736
diff changeset
   980
            Data.log_name(table1) + " = " + Data.log_name(table2) + " AND " +
wenzelm
parents: 65736
diff changeset
   981
            Data.session_name(table1) + " = " + Data.session_name(table2)
65668
366bc4e6a238 more operations;
wenzelm
parents: 65665
diff changeset
   982
          (columns, SQL.enclose(join))
65645
2c704ae04db1 clarified database layout: bulky ml_statistics are stored/retrieved separately;
wenzelm
parents: 65643
diff changeset
   983
        }
65695
4edac706bc5e tuned signature;
wenzelm
parents: 65694
diff changeset
   984
        else (columns1, table1.ident)
65645
2c704ae04db1 clarified database layout: bulky ml_statistics are stored/retrieved separately;
wenzelm
parents: 65643
diff changeset
   985
65621
551950dccec6 operations to read database;
wenzelm
parents: 65619
diff changeset
   986
      val sessions =
65698
38139b2067cf clarified signature;
wenzelm
parents: 65697
diff changeset
   987
        db.using_statement(SQL.select(columns) + from + " " + where)(stmt =>
65621
551950dccec6 operations to read database;
wenzelm
parents: 65619
diff changeset
   988
        {
65740
83388f09e9ab clarified signature;
wenzelm
parents: 65738
diff changeset
   989
          stmt.execute_query().iterator(res =>
65621
551950dccec6 operations to read database;
wenzelm
parents: 65619
diff changeset
   990
          {
65740
83388f09e9ab clarified signature;
wenzelm
parents: 65738
diff changeset
   991
            val session_name = res.string(Data.session_name)
65626
wenzelm
parents: 65625
diff changeset
   992
            val session_entry =
wenzelm
parents: 65625
diff changeset
   993
              Session_Entry(
65740
83388f09e9ab clarified signature;
wenzelm
parents: 65738
diff changeset
   994
                chapter = res.string(Data.chapter),
83388f09e9ab clarified signature;
wenzelm
parents: 65738
diff changeset
   995
                groups = split_lines(res.string(Data.groups)),
83388f09e9ab clarified signature;
wenzelm
parents: 65738
diff changeset
   996
                threads = res.get_int(Data.threads),
65741
wenzelm
parents: 65740
diff changeset
   997
                timing = res.timing(Data.timing_elapsed, Data.timing_cpu, Data.timing_gc),
65626
wenzelm
parents: 65625
diff changeset
   998
                ml_timing =
65741
wenzelm
parents: 65740
diff changeset
   999
                  res.timing(Data.ml_timing_elapsed, Data.ml_timing_cpu, Data.ml_timing_gc),
65740
83388f09e9ab clarified signature;
wenzelm
parents: 65738
diff changeset
  1000
                heap_size = res.get_long(Data.heap_size),
83388f09e9ab clarified signature;
wenzelm
parents: 65738
diff changeset
  1001
                status = res.get_string(Data.status).map(Session_Status.withName(_)),
65629
e6c0afe672fa optional ml_statistics: much faster;
wenzelm
parents: 65628
diff changeset
  1002
                ml_statistics =
65740
83388f09e9ab clarified signature;
wenzelm
parents: 65738
diff changeset
  1003
                  if (ml_statistics) uncompress_properties(res.bytes(Data.ml_statistics))
65629
e6c0afe672fa optional ml_statistics: much faster;
wenzelm
parents: 65628
diff changeset
  1004
                  else Nil)
65626
wenzelm
parents: 65625
diff changeset
  1005
            session_name -> session_entry
65621
551950dccec6 operations to read database;
wenzelm
parents: 65619
diff changeset
  1006
          }).toMap
551950dccec6 operations to read database;
wenzelm
parents: 65619
diff changeset
  1007
        })
551950dccec6 operations to read database;
wenzelm
parents: 65619
diff changeset
  1008
      Build_Info(sessions)
551950dccec6 operations to read database;
wenzelm
parents: 65619
diff changeset
  1009
    }
65595
ffd8283b7be0 support for database connection;
wenzelm
parents: 65591
diff changeset
  1010
  }
64045
c6160d0b0337 clarified modules;
wenzelm
parents:
diff changeset
  1011
}