src/Pure/Admin/build_log.scala
author wenzelm
Wed May 03 14:55:34 2017 +0200 (2017-05-03)
changeset 65694 b82f2990161a
parent 65693 99676834e53c
child 65695 4edac706bc5e
permissions -rw-r--r--
clarified modules;
wenzelm@64160
     1
/*  Title:      Pure/Admin/build_log.scala
wenzelm@64045
     2
    Author:     Makarius
wenzelm@64045
     3
wenzelm@65608
     4
Management of build log files and database storage.
wenzelm@64045
     5
*/
wenzelm@64045
     6
wenzelm@64045
     7
package isabelle
wenzelm@64045
     8
wenzelm@64045
     9
wenzelm@64100
    10
import java.io.{File => JFile}
wenzelm@64100
    11
import java.time.ZoneId
wenzelm@64110
    12
import java.time.format.{DateTimeFormatter, DateTimeParseException}
wenzelm@64096
    13
import java.util.Locale
wenzelm@65599
    14
import java.sql.PreparedStatement
wenzelm@64061
    15
wenzelm@65600
    16
import scala.collection.immutable.SortedMap
wenzelm@64054
    17
import scala.collection.mutable
wenzelm@64054
    18
import scala.util.matching.Regex
wenzelm@64054
    19
wenzelm@64054
    20
wenzelm@64045
    21
object Build_Log
wenzelm@64045
    22
{
wenzelm@64298
    23
  /** content **/
wenzelm@64101
    24
wenzelm@64298
    25
  /* properties */
wenzelm@64150
    26
wenzelm@64298
    27
  /* SQL columns for the properties of a build: all of them string-valued,
     except for the two dates build_start and build_end. */
  object Prop
  {
    val build_tags = SQL.Column.string("build_tags")  // lines
    val build_args = SQL.Column.string("build_args")  // lines

    // identification of the build
    val build_group_id = SQL.Column.string("build_group_id")
    val build_id = SQL.Column.string("build_id")
    val build_engine = SQL.Column.string("build_engine")
    val build_host = SQL.Column.string("build_host")

    // time span of the build
    val build_start = SQL.Column.date("build_start")
    val build_end = SQL.Column.date("build_end")

    // versions
    val isabelle_version = SQL.Column.string("isabelle_version")
    val afp_version = SQL.Column.string("afp_version")

    // every column declared above, in declaration order
    val all_props: List[SQL.Column] =
      build_tags :: build_args :: build_group_id :: build_id :: build_engine ::
      build_host :: build_start :: build_end :: isabelle_version :: afp_version :: Nil
  }
wenzelm@64150
    44
wenzelm@64150
    45
wenzelm@64298
    46
  /* settings */
wenzelm@64080
    47
wenzelm@64081
    48
  /* Settings that are shown in and read back from log files:
     ISABELLE_BUILD_OPTIONS plus the ML_* family. */
  object Settings
  {
    val ISABELLE_BUILD_OPTIONS = SQL.Column.string("ISABELLE_BUILD_OPTIONS")
    val ML_PLATFORM = SQL.Column.string("ML_PLATFORM")
    val ML_HOME = SQL.Column.string("ML_HOME")
    val ML_SYSTEM = SQL.Column.string("ML_SYSTEM")
    val ML_OPTIONS = SQL.Column.string("ML_OPTIONS")

    val ml_settings = ML_PLATFORM :: ML_HOME :: ML_SYSTEM :: ML_OPTIONS :: Nil
    val all_settings = List(ISABELLE_BUILD_OPTIONS) ::: ml_settings

    type Entry = (String, String)
    type T = List[Entry]

    object Entry
    {
      // split at the first '=': the name is taken verbatim, the value passes
      // through Library.perhaps_unquote; a line without '=' is no entry
      def unapply(s: String): Option[Entry] =
      {
        val pos = s.indexOf('=')
        if (pos < 0) None
        else Some((s.substring(0, pos), Library.perhaps_unquote(s.substring(pos + 1))))
      }

      // printed form: name, '=', quote(value)
      def apply(a: String, b: String): String = s"$a=${quote(b)}"

      // printed form of a setting taken from the Isabelle environment
      def getenv(a: String): String = apply(a, Isabelle_System.getenv(a))
    }

    // ISABELLE_BUILD_OPTIONS, an empty line, then one line per ML setting
    def show(): String =
    {
      val build_options = Entry.getenv(ISABELLE_BUILD_OPTIONS.name)
      val ml_entries = ml_settings.map(c => Entry.getenv(c.name))
      cat_lines(build_options :: "" :: ml_entries)
    }
  }
wenzelm@64080
    81
wenzelm@64080
    82
wenzelm@64298
    83
  /* file names */
wenzelm@64298
    84
wenzelm@64298
    85
  /* Date stamp used in log file names: the day of date.rep as "yyyy-MM-dd",
     a dot, and the time since date.midnight in ms divided by 1000, padded
     with zeros to at least 5 digits.  Formatting uses Locale.ROOT. */
  def log_date(date: Date): String =
  {
    val day = DateTimeFormatter.ofPattern("yyyy-MM-dd").format(date.rep)
    val seconds_of_day = (date.time - date.midnight.time).ms / 1000
    // Long.valueOf replaces the deprecated boxing constructor new java.lang.Long(...)
    String.format(Locale.ROOT, "%s.%05d", day, java.lang.Long.valueOf(seconds_of_day))
  }
wenzelm@64298
    89
wenzelm@64298
    90
  /* Sub-directory for the logs of a date: "log" followed by the year of date.rep. */
  def log_subdir(date: Date): Path =
  {
    val year = date.rep.getYear.toString
    Path.explode("log") + Path.explode(year)
  }
wenzelm@64298
    92
wenzelm@64298
    93
  /* File name of a log: engine, log_date(date) and any further components,
     joined by "_" and terminated by ".log". */
  def log_filename(engine: String, date: Date, more: List[String] = Nil): Path =
  {
    val parts = engine :: log_date(date) :: more
    Path.explode(parts.mkString("_") + ".log")
  }
wenzelm@64298
    95
wenzelm@64298
    96
wenzelm@64100
    97
wenzelm@64062
    98
  /** log file **/
wenzelm@64045
    99
wenzelm@64155
   100
  /* Print a date via the date format of log files (Log_File.Date_Format). */
  def print_date(date: Date): String =
    Log_File.Date_Format.apply(date)
wenzelm@64155
   101
wenzelm@64062
   102
  /* Companion of class Log_File: construction from name / text / file,
     recognition of log files within directories, the date format of log
     content, and printing of inlined properties. */
  object Log_File
  {
    /* log file */

    // remove the first matching log / compression suffix from a file name;
    // names without any of these suffixes are returned unchanged
    def plain_name(name: String): String =
    {
      val suffixes = List(".log", ".log.gz", ".log.xz", ".gz", ".xz")
      suffixes.find(name.endsWith(_))
        .map(suffix => Library.try_unsuffix(suffix, name).get)
        .getOrElse(name)
    }

    def apply(name: String, lines: List[String]): Log_File =
      new Log_File(plain_name(name), lines)

    def apply(name: String, text: String): Log_File =
      Log_File(name, Library.trim_split_lines(text))

    // read a file, with decompression selected by the suffix of its name
    def apply(file: JFile): Log_File =
    {
      val file_name = file.getName
      val content =
        if (file_name.endsWith(".gz")) File.read_gzip(file)
        else if (file_name.endsWith(".xz")) File.read_xz(file)
        else File.read(file)
      apply(file_name, content)
    }

    def apply(path: Path): Log_File = apply(path.file)


    /* log file collections */

    // a log file has one of the given prefixes and suffixes, and is not one
    // of the explicitly excluded plain names
    def is_log(file: JFile,
      prefixes: List[String] =
        List(Build_History.log_prefix, Identify.log_prefix, Isatest.log_prefix,
          AFP_Test.log_prefix, Jenkins.log_prefix),
      suffixes: List[String] = List(".log", ".log.gz", ".log.xz")): Boolean =
    {
      val name = file.getName
      val excluded = Set("isatest.log", "afp-test.log", "main.log")

      prefixes.exists(prefix => name.startsWith(prefix)) &&
      suffixes.exists(suffix => name.endsWith(suffix)) &&
      !excluded.contains(name)
    }

    // all log files (according to the defaults of is_log) below the given directories
    def find_files(dirs: Iterable[Path]): List[JFile] =
      dirs.iterator.flatMap(dir => File.find_files(dir.file, file => is_log(file))).toList


    /* date format */

    val Date_Format =
    {
      // formats with explicit zone, in English and German variants
      val zoned_formats =
        Date.Formatter.variants(
          List("EEE MMM d HH:mm:ss O yyyy", "EEE MMM d HH:mm:ss VV yyyy"),
          List(Locale.ENGLISH, Locale.GERMAN))
      // RFC 1123, and a zone-less format that is read as Europe/Berlin
      val other_formats =
        List(
          DateTimeFormatter.RFC_1123_DATE_TIME,
          Date.Formatter.pattern("EEE MMM d HH:mm:ss yyyy").withZone(ZoneId.of("Europe/Berlin")))
      val fmts = zoned_formats ::: other_formats

      // replacements for time zone names; other words are unchanged
      val timezones =
        Map(
          "CET" -> "GMT+1", "MET" -> "GMT+1",
          "CEST" -> "GMT+2", "MEST" -> "GMT+2",
          "EST" -> "Europe/Berlin")
      def tune_timezone(s: String): String = timezones.getOrElse(s, s)

      // replacements for three-letter German weekdays; other words are unchanged
      val weekdays =
        Map("Die" -> "Di", "Mit" -> "Mi", "Don" -> "Do", "Fre" -> "Fr", "Sam" -> "Sa", "Son" -> "So")
      def tune_weekday(s: String): String = weekdays.getOrElse(s, s)

      // normalize the words of a date string before parsing: the first word
      // as weekday, a damaged "Mär" in second position, the rest as time zones
      def tune(s: String): String =
      {
        val words =
          Word.explode(s) match {
            case Nil => Nil
            case day :: "M\uFFFDr" :: rest =>
              tune_weekday(day) :: "Mär" :: rest.map(tune_timezone(_))
            case day :: rest =>
              tune_weekday(day) :: rest.map(tune_timezone(_))
          }
        Word.implode(words)
      }

      Date.Format.make(fmts, tune)
    }


    /* inlined content */

    // marker followed by the YXML string of the line-encoded properties
    def print_props(marker: String, props: Properties.T): String =
    {
      val body = XML.Encode.properties(Properties.encode_lines(props))
      marker + YXML.string_of_body(body)
    }
  }
wenzelm@64102
   202
wenzelm@64102
   203
  /* A log file as plain name with its lines of text, together with
     operations to search the lines and to parse the various log formats. */
  class Log_File private(val name: String, val lines: List[String])
  {
    log_file =>

    override def toString: String = name

    def text: String = cat_lines(lines)

    // error that mentions the name of this log file
    def err(msg: String): Nothing =
    {
      val where = "Error in log file " + quote(name)
      error(where + ": " + msg)
    }


    /* date format */

    // irrefutable date extractor: a parse failure becomes an error of this log file
    object Strict_Date
    {
      def unapply(s: String): Some[Date] =
      {
        val date =
          try { Log_File.Date_Format.parse(s) }
          catch { case exn: DateTimeParseException => log_file.err(exn.getMessage) }
        Some(date)
      }
    }


    /* inlined content */

    // result of f for the first line where it is defined
    def find[A](f: String => Option[A]): Option[A] =
      lines.iterator.map(f).collectFirst({ case Some(x) => x })

    // remainder of the first line that starts with the marker
    def find_line(marker: String): Option[String] =
      find(line => Library.try_unprefix(marker, line))

    // the single group of the first line matched by the first successful
    // regex: each regex is tried on all lines before the next one is used
    def find_match(regexes: List[Regex]): Option[String] =
    {
      def first_match(regex: Regex): Option[String] =
        lines.iterator.map(line => regex.unapplySeq(line))
          .collectFirst({ case Some(List(group)) => group })

      regexes.iterator.map(first_match(_)).collectFirst({ case Some(result) => result })
    }


    /* settings */

    // entry of the first line of the form a=...
    def get_setting(a: String): Option[Settings.Entry] =
    {
      val prefix = a + "="
      lines.find(_.startsWith(prefix)).flatMap(line => Settings.Entry.unapply(line))
    }

    // entries of all known settings that occur in this log file
    def get_all_settings: Settings.T =
      Settings.all_settings.flatMap(c => get_setting(c.name))


    /* properties (YXML) */

    val xml_cache = new XML.Cache()

    def parse_props(text: String): Properties.T =
    {
      val body = YXML.parse_body(text)
      xml_cache.props(Properties.decode_lines(XML.Decode.properties(body)))
    }

    // properties of all lines with the given marker and YXML content
    def filter_props(marker: String): List[Properties.T] =
      lines.flatMap(line =>
        Library.try_unprefix(marker, line).filter(s => YXML.detect(s)).map(s => parse_props(s)))

    // properties of the first line with the given marker, provided that it is YXML
    def find_props(marker: String): Option[Properties.T] =
      find_line(marker).filter(s => YXML.detect(s)).map(s => parse_props(s))


    /* parse various formats */

    def parse_meta_info(): Meta_Info = Build_Log.parse_meta_info(this)

    def parse_build_info(ml_statistics: Boolean = false): Build_Info =
      Build_Log.parse_build_info(this, ml_statistics)

    def parse_session_info(
        command_timings: Boolean = false,
        ml_statistics: Boolean = false,
        task_statistics: Boolean = false): Session_Info =
      Build_Log.parse_session_info(this, command_timings, ml_statistics, task_statistics)
  }
wenzelm@64045
   289
wenzelm@64045
   290
wenzelm@64098
   291
wenzelm@65276
   292
  /** digested meta info: produced by Admin/build_history in log.xz file **/
wenzelm@64045
   293
wenzelm@64108
   294
  object Meta_Info
  {
    // no properties, no settings
    val empty: Meta_Info = Meta_Info(props = Nil, settings = Nil)
  }

  /* Meta info of a log file: properties and settings, both addressed by column name. */
  sealed case class Meta_Info(props: Properties.T, settings: Settings.T)
  {
    def is_empty: Boolean = !(props.nonEmpty || settings.nonEmpty)

    // value of a column: properties take precedence over settings
    def get(c: SQL.Column): Option[String] =
      Properties.get(props, c.name) match {
        case None => Properties.get(settings, c.name)
        case result => result
      }

    // value of a column, parsed via the date format of log files
    def get_date(c: SQL.Column): Option[Date] =
      for (s <- get(c)) yield Log_File.Date_Format.parse(s)
  }
wenzelm@64061
   310
wenzelm@65625
   311
  /* Log format "isabelle_identify": a dated header line followed by optional
     version lines. */
  object Identify
  {
    val log_prefix = "isabelle_identify_"

    // engine name, depending on whether the log file name has the Jenkins prefix
    def engine(log_file: Log_File): String =
    {
      val from_jenkins = log_file.name.startsWith(Jenkins.log_prefix)
      if (from_jenkins) "jenkins_identify" else "identify"
    }

    // log content: header with date, empty line, then the versions that are given
    def content(date: Date, isabelle_version: Option[String], afp_version: Option[String]): String =
    {
      val header = List("isabelle_identify: " + Build_Log.print_date(date), "")
      val versions =
        isabelle_version.map("Isabelle version: " + _).toList :::
        afp_version.map("AFP version: " + _).toList
      terminate_lines(header ::: versions)
    }

    val Start = """^isabelle_identify: (.+)$""".r
    val No_End = """$.""".r  // demands a character after the end of input
    val Isabelle_Version = List("""^Isabelle version: (\S+)$""".r)
    val AFP_Version = List("""^AFP version: (\S+)$""".r)
  }
wenzelm@65625
   330
wenzelm@64095
   331
  /* Log format of isatest: file name prefix, engine name, and the patterns
     for start line (date, host), end line (date) and Isabelle version. */
  object Isatest
  {
    val log_prefix = "isatest-makeall-"
    val engine = "isatest"

    val Start = """^------------------- starting test --- (.+) --- (.+)$""".r
    val End = """^------------------- test (?:successful|FAILED) --- (.+) --- .*$""".r
    val Isabelle_Version = List("""^Isabelle version: (\S+)$""".r)
  }
wenzelm@64095
   339
wenzelm@64109
   340
  /* Log format of afp-test: file name prefix, engine name, and the patterns
     for start lines (with or without trailing host part), end line, version
     lines with "hg id", and a failure line of the form "cp:...". */
  object AFP_Test
  {
    val log_prefix = "afp-test-devel-"
    val engine = "afp-test"

    val Start = """^Start test(?: for .+)? at ([^,]+), (.*)$""".r
    val Start_Old = """^Start test(?: for .+)? at ([^,]+)$""".r
    val End = """^End test on (.+), .+, elapsed time:.*$""".r

    val Isabelle_Version = List("""^Isabelle version: .* -- hg id (\S+)$""".r)
    val AFP_Version = List("""^AFP version: .* -- hg id (\S+)$""".r)

    val Bad_Init = """^cp:.*: Disc quota exceeded$""".r
  }
wenzelm@64061
   351
wenzelm@64110
   352
  /* Log format of Jenkins: file name prefix, engine name, patterns for the
     host line, start of log, start date and versions, and the literal
     section markers of the log. */
  object Jenkins
  {
    val log_prefix = "jenkins_"
    val engine = "jenkins"

    val Host = """^Building remotely on (\S+) \((\S+)\).*$""".r
    // NOTE(review): the empty last alternative followed by .* accepts any line
    val Start = """^(?:Started by an SCM change|Started from command line by admin|).*$""".r
    val Start_Date = """^Build started at (.+)$""".r
    val No_End = """$.""".r  // demands a character after the end of input

    // alternatives are tried in the given order, see Log_File.find_match
    val Isabelle_Version =
      List(
        """^(?:Build for Isabelle id|Isabelle id) (\w+).*$""",
        """^ISABELLE_CI_REPO_ID="(\w+)".*$""",
        """^(\w{12}) tip.*$""").map(_.r)
    val AFP_Version =
      List(
        """^(?:Build for AFP id|AFP id) (\w+).*$""",
        """^ISABELLE_CI_AFP_ID="(\w+)".*$""").map(_.r)

    val CONFIGURATION = "=== CONFIGURATION ==="
    val BUILD = "=== BUILD ==="
  }
wenzelm@64110
   370
wenzelm@64105
   371
  /* Digest the meta info of a log file.  The format is detected from the
     leading lines: inlined meta info of Build_History, isabelle_identify,
     isatest, afp-test (new and old start line), or Jenkins.  Some damaged or
     empty logs yield Meta_Info.empty; anything else is an error of the log
     file.  Dates are extracted via log_file.Strict_Date, so an unparsable
     date is an error of the log file as well. */
  private def parse_meta_info(log_file: Log_File): Meta_Info =
  {
    /* meta info from patterns for the end line and the version lines */
    def parse(engine: String, host: String, start: Date,
      End: Regex, Isabelle_Version: List[Regex], AFP_Version: List[Regex]): Meta_Info =
    {
      // build id: host, otherwise engine, otherwise "build" -- then ":" and the start time in ms
      val build_id =
        List(host, engine).find(_ != "").getOrElse("build") + ":" + start.time.ms

      val build_engine = if (engine == "") Nil else List(Prop.build_engine.name -> engine)
      val build_host = if (host == "") Nil else List(Prop.build_host.name -> host)

      val start_date = List(Prop.build_start.name -> print_date(start))

      // only the very last line is considered as end line; lastOption keeps
      // this total for empty logs
      val end_date =
        log_file.lines.lastOption match {
          case Some(End(log_file.Strict_Date(end_date))) =>
            List(Prop.build_end.name -> print_date(end_date))
          case _ => Nil
        }

      val isabelle_version =
        log_file.find_match(Isabelle_Version).map(Prop.isabelle_version.name -> _)
      val afp_version =
        log_file.find_match(AFP_Version).map(Prop.afp_version.name -> _)

      Meta_Info((Prop.build_id.name -> build_id) :: build_engine ::: build_host :::
          start_date ::: end_date ::: isabelle_version.toList ::: afp_version.toList,
        log_file.get_all_settings)
    }

    log_file.lines match {
      // inlined meta info: the marker line must carry YXML properties;
      // otherwise report an error of the log file instead of failing with
      // NoSuchElementException from Option.get
      case line :: _ if line.startsWith(Build_History.META_INFO_MARKER) =>
        log_file.find_props(Build_History.META_INFO_MARKER) match {
          case Some(props) => Meta_Info(props, log_file.get_all_settings)
          case None => log_file.err("malformed meta info")
        }

      case Identify.Start(log_file.Strict_Date(start)) :: _ =>
        parse(Identify.engine(log_file), "", start, Identify.No_End,
          Identify.Isabelle_Version, Identify.AFP_Version)

      case Isatest.Start(log_file.Strict_Date(start), host) :: _ =>
        parse(Isatest.engine, host, start, Isatest.End,
          Isatest.Isabelle_Version, Nil)

      case AFP_Test.Start(log_file.Strict_Date(start), host) :: _ =>
        parse(AFP_Test.engine, host, start, AFP_Test.End,
          AFP_Test.Isabelle_Version, AFP_Test.AFP_Version)

      case AFP_Test.Start_Old(log_file.Strict_Date(start)) :: _ =>
        parse(AFP_Test.engine, "", start, AFP_Test.End,
          AFP_Test.Isabelle_Version, AFP_Test.AFP_Version)

      // NOTE(review): the pattern of Jenkins.Start accepts any line, so this
      // case takes every remaining non-empty log and the cases below it only
      // apply to Nil -- confirm that this is intended
      case Jenkins.Start() :: _ =>
        // the start date is expected two lines after the BUILD marker
        log_file.lines.dropWhile(_ != Jenkins.BUILD) match {
          case Jenkins.BUILD :: _ :: Jenkins.Start_Date(log_file.Strict_Date(start)) :: _ =>
            // the host line is searched before the CONFIGURATION marker
            val host =
              log_file.lines.takeWhile(_ != Jenkins.CONFIGURATION).collectFirst({
                case Jenkins.Host(a, b) => a + "." + b
              }).getOrElse("")
            parse(Jenkins.engine, host, start.to(ZoneId.of("Europe/Berlin")), Jenkins.No_End,
              Jenkins.Isabelle_Version, Jenkins.AFP_Version)
          case _ => Meta_Info.empty
        }

      case line :: _ if line.startsWith("\u0000") => Meta_Info.empty
      case List(Isatest.End(_)) => Meta_Info.empty
      case _ :: AFP_Test.Bad_Init() :: _ => Meta_Info.empty
      case Nil => Meta_Info.empty

      case _ => log_file.err("cannot detect log file format")
    }
  }
wenzelm@64061
   443
wenzelm@64085
   444
wenzelm@64098
   445
wenzelm@65276
   446
  /** build info: toplevel output of isabelle build or Admin/build_history **/
wenzelm@64119
   447
wenzelm@64119
   448
  // prefix of log lines that carry ML statistics as inlined properties
  val ML_STATISTICS_MARKER: String = "\fML_statistics = "

  // name of the leading property that is expected in ML statistics lines
  val SESSION_NAME: String = "session_name"
wenzelm@64085
   450
wenzelm@64061
   451
  /* Status of a session within a build log; the order of declaration
     determines the ids of the values. */
  object Session_Status extends Enumeration
  {
    val existing = Value
    val finished = Value
    val failed = Value
    val cancelled = Value
  }
wenzelm@64061
   455
wenzelm@65643
   456
  object Session_Entry
  {
    // entry with default values for all fields
    val empty: Session_Entry = new Session_Entry()
  }

  /* Information about one session of a build; every field has a default
     that stands for "unknown". */
  sealed case class Session_Entry(
    chapter: String = "",
    groups: List[String] = Nil,
    threads: Option[Int] = None,
    timing: Timing = Timing.zero,
    ml_timing: Timing = Timing.zero,
    heap_size: Option[Long] = None,
    status: Option[Session_Status.Value] = None,
    ml_statistics: List[Properties.T] = Nil)
  {
    // the chapter, unless it is the empty string
    def proper_chapter: Option[String] = Some(chapter).filter(_ != "")

    // the groups as lines of text, unless there are none
    def proper_groups: Option[String] =
      if (groups.nonEmpty) Some(cat_lines(groups)) else None

    def finished: Boolean =
      status match {
        case Some(Session_Status.finished) => true
        case _ => false
      }
  }
wenzelm@64054
   475
wenzelm@64085
   476
  /* Build info: session entries by session name, with accessors that fall
     back on default values for unknown sessions. */
  sealed case class Build_Info(sessions: Map[String, Session_Entry])
  {
    // entry of a known session; the underlying map lookup fails for unknown names
    def session(name: String): Session_Entry = sessions.apply(name)
    def get_session(name: String): Option[Session_Entry] = sessions.get(name)

    // f applied to the entry of a session, or x if there is no such session
    def get_default[A](name: String, f: Session_Entry => A, x: A): A =
      get_session(name).map(f).getOrElse(x)

    def finished_sessions: List[String] =
      (for (name <- sessions.keySet.iterator if finished(name)) yield name).toList

    def finished(name: String): Boolean =
      get_default(name, entry => entry.finished, false)

    def timing(name: String): Timing =
      get_default(name, entry => entry.timing, Timing.zero)

    def ml_timing(name: String): Timing =
      get_default(name, entry => entry.ml_timing, Timing.zero)

    def ml_statistics(name: String): ML_Statistics =
      get_default(name, entry => ML_Statistics(name, entry.ml_statistics), ML_Statistics.empty)
  }
wenzelm@64054
   494
wenzelm@65646
   495
  /* Digest the toplevel build output of a log file.  Each line is matched
     against the session patterns below and the information is accumulated
     per session name; lines that match nothing are ignored.  ML statistics
     are only parsed if parse_ml_statistics is set.

     Status of a session, in order of precedence: failed / cancelled if an
     explicit "... FAILED" / "... CANCELLED" line was seen; finished if there
     is timing information; failed if it was started without such
     information; existing otherwise. */
  private def parse_build_info(log_file: Log_File, parse_ml_statistics: Boolean): Build_Info =
  {
    // irrefutable split of "chapter/name"; any other shape has empty chapter
    object Chapter_Name
    {
      def unapply(s: String): Some[(String, String)] =
        space_explode('/', s) match {
          case List(chapter, name) => Some((chapter, name))
          case _ => Some(("", s))
        }
    }

    val Session_No_Groups = new Regex("""^Session (\S+)$""")
    val Session_Groups = new Regex("""^Session (\S+) \((.*)\)$""")
    val Session_Finished1 =
      new Regex("""^Finished (\S+) \((\d+):(\d+):(\d+) elapsed time, (\d+):(\d+):(\d+) cpu time.*$""")
    val Session_Finished2 =
      new Regex("""^Finished (\S+) \((\d+):(\d+):(\d+) elapsed time.*$""")
    val Session_Timing =
      new Regex("""^Timing (\S+) \((\d+) threads, (\d+\.\d+)s elapsed time, (\d+\.\d+)s cpu time, (\d+\.\d+)s GC time.*$""")
    val Session_Started = new Regex("""^(?:Running|Building) (\S+) \.\.\.$""")
    val Session_Failed = new Regex("""^(\S+) FAILED""")
    val Session_Cancelled = new Regex("""^(\S+) CANCELLED""")
    val Heap = new Regex("""^Heap (\S+) \((\d+) bytes\)$""")

    // accumulated information, by session name
    var chapter = Map.empty[String, String]
    var groups = Map.empty[String, List[String]]
    var threads = Map.empty[String, Int]
    var timing = Map.empty[String, Timing]
    var ml_timing = Map.empty[String, Timing]
    var started = Set.empty[String]
    var failed = Set.empty[String]
    var cancelled = Set.empty[String]
    var heap_sizes = Map.empty[String, Long]
    var ml_statistics = Map.empty[String, List[Properties.T]]

    // every session that was mentioned in any way
    def all_sessions: Set[String] =
      chapter.keySet ++ groups.keySet ++ threads.keySet ++ timing.keySet ++ ml_timing.keySet ++
      failed ++ cancelled ++ started ++ heap_sizes.keySet ++ ml_statistics.keySet


    for (line <- log_file.lines) {
      line match {
        case Session_No_Groups(Chapter_Name(chapt, name)) =>
          chapter += (name -> chapt)
          groups += (name -> Nil)

        case Session_Groups(Chapter_Name(chapt, name), grps) =>
          chapter += (name -> chapt)
          groups += (name -> Word.explode(grps))

        case Session_Started(name) =>
          started += name

        case Session_Finished1(name,
            Value.Int(e1), Value.Int(e2), Value.Int(e3),
            Value.Int(c1), Value.Int(c2), Value.Int(c3)) =>
          val elapsed = Time.hms(e1, e2, e3)
          val cpu = Time.hms(c1, c2, c3)
          timing += (name -> Timing(elapsed, cpu, Time.zero))

        // only reached if Session_Finished1 did not match: no cpu time given
        case Session_Finished2(name,
            Value.Int(e1), Value.Int(e2), Value.Int(e3)) =>
          val elapsed = Time.hms(e1, e2, e3)
          timing += (name -> Timing(elapsed, Time.zero, Time.zero))

        case Session_Timing(name,
            Value.Int(t), Value.Double(e), Value.Double(c), Value.Double(g)) =>
          val elapsed = Time.seconds(e)
          val cpu = Time.seconds(c)
          val gc = Time.seconds(g)
          ml_timing += (name -> Timing(elapsed, cpu, gc))
          threads += (name -> t)

        case Heap(name, Value.Long(size)) =>
          heap_sizes += (name -> size)

        // explicit failure / cancellation lines: these patterns were defined
        // without being matched, which left the sets failed and cancelled
        // empty; placed after the other patterns to keep their precedence
        case Session_Failed(name) =>
          failed += name

        case Session_Cancelled(name) =>
          cancelled += name

        case _
        if parse_ml_statistics && line.startsWith(ML_STATISTICS_MARKER) && YXML.detect(line) =>
          val (name, props) =
            Library.try_unprefix(ML_STATISTICS_MARKER, line).map(log_file.parse_props(_)) match {
              case Some((SESSION_NAME, session_name) :: props) => (session_name, props)
              case _ => log_file.err("malformed ML_statistics " + quote(line))
            }
          // accumulated in reverse order, see the final reverse below
          ml_statistics += (name -> (props :: ml_statistics.getOrElse(name, Nil)))

        case _ =>
      }
    }

    val sessions =
      (for (name <- all_sessions.toList) yield {
        val status =
          if (failed(name)) Session_Status.failed
          else if (cancelled(name)) Session_Status.cancelled
          else if (timing.isDefinedAt(name) || ml_timing.isDefinedAt(name))
            Session_Status.finished
          else if (started(name)) Session_Status.failed
          else Session_Status.existing
        val entry =
          Session_Entry(
            chapter = chapter.getOrElse(name, ""),
            groups = groups.getOrElse(name, Nil),
            threads = threads.get(name),
            timing = timing.getOrElse(name, Timing.zero),
            ml_timing = ml_timing.getOrElse(name, Timing.zero),
            heap_size = heap_sizes.get(name),
            status = Some(status),
            ml_statistics = ml_statistics.getOrElse(name, Nil).reverse)
        (name -> entry)
      }).toMap
    Build_Info(sessions)
  }
wenzelm@64099
   608
wenzelm@64099
   609
wenzelm@64099
   610
wenzelm@65276
   611
  /** session info: produced by isabelle build as session log.gz file **/
wenzelm@64099
   612
wenzelm@64099
   613
  /* Raw property lists taken from one session log; built by parse_session_info,
     which leaves a field empty (Nil) when the corresponding entries are absent
     or were not requested. */
  sealed case class Session_Info(
wenzelm@64099
   614
    session_timing: Properties.T,
wenzelm@64099
   615
    command_timings: List[Properties.T],
wenzelm@64099
   616
    ml_statistics: List[Properties.T],
wenzelm@64099
   617
    task_statistics: List[Properties.T])
wenzelm@64099
   618
wenzelm@64099
   619
  /* Collect the session info of a log file.  The session timing is always
     looked up; each of the three property lists is only extracted when its
     flag is set, and is Nil otherwise. */
  private def parse_session_info(
    log_file: Log_File,
    command_timings: Boolean,
    ml_statistics: Boolean,
    task_statistics: Boolean): Session_Info =
  {
    // property lists for a marker, or nothing if that kind was not requested
    def optional_props(enabled: Boolean, marker: String): List[Properties.T] =
      if (enabled) log_file.filter_props(marker) else Nil

    Session_Info(
      session_timing = log_file.find_props("\fTiming = ").getOrElse(Nil),
      command_timings = optional_props(command_timings, "\fcommand_timing = "),
      ml_statistics = optional_props(ml_statistics, ML_STATISTICS_MARKER),
      task_statistics = optional_props(task_statistics, "\ftask_statistics = "))
  }
wenzelm@65595
   631
wenzelm@65595
   632
wenzelm@65595
   633
wenzelm@65595
   634
  /** persistent store **/
wenzelm@65595
   635
wenzelm@65694
   636
  /* SQL data model */
wenzelm@65694
   637
wenzelm@65694
   638
  object Data
wenzelm@65694
   639
  {
wenzelm@65694
   640
    /* main content */
wenzelm@65694
   641
wenzelm@65694
   642
    val log_name = SQL.Column.string("log_name", primary_key = true)
wenzelm@65694
   643
    val session_name = SQL.Column.string("session_name", primary_key = true)
wenzelm@65694
   644
    val chapter = SQL.Column.string("chapter")
wenzelm@65694
   645
    val groups = SQL.Column.string("groups")
wenzelm@65694
   646
    val threads = SQL.Column.int("threads")
wenzelm@65694
   647
    val timing_elapsed = SQL.Column.long("timing_elapsed")
wenzelm@65694
   648
    val timing_cpu = SQL.Column.long("timing_cpu")
wenzelm@65694
   649
    val timing_gc = SQL.Column.long("timing_gc")
wenzelm@65694
   650
    val timing_factor = SQL.Column.double("timing_factor")
wenzelm@65694
   651
    val ml_timing_elapsed = SQL.Column.long("ml_timing_elapsed")
wenzelm@65694
   652
    val ml_timing_cpu = SQL.Column.long("ml_timing_cpu")
wenzelm@65694
   653
    val ml_timing_gc = SQL.Column.long("ml_timing_gc")
wenzelm@65694
   654
    val ml_timing_factor = SQL.Column.double("ml_timing_factor")
wenzelm@65694
   655
    val heap_size = SQL.Column.long("heap_size")
wenzelm@65694
   656
    val status = SQL.Column.string("status")
wenzelm@65694
   657
    val ml_statistics = SQL.Column.bytes("ml_statistics")
wenzelm@65694
   658
wenzelm@65694
   659
    val meta_info_table =
wenzelm@65694
   660
      SQL.Table("isabelle_build_log_meta_info", log_name :: Prop.all_props ::: Settings.all_settings)
wenzelm@65694
   661
wenzelm@65694
   662
    val sessions_table =
wenzelm@65694
   663
      SQL.Table("isabelle_build_log_sessions",
wenzelm@65694
   664
        List(log_name, session_name, chapter, groups, threads, timing_elapsed, timing_cpu,
wenzelm@65694
   665
          timing_gc, timing_factor, ml_timing_elapsed, ml_timing_cpu, ml_timing_gc, ml_timing_factor,
wenzelm@65694
   666
          heap_size, status))
wenzelm@65694
   667
wenzelm@65694
   668
    val ml_statistics_table =
wenzelm@65694
   669
      SQL.Table("isabelle_build_log_ml_statistics",
wenzelm@65694
   670
        List(log_name, session_name, ml_statistics))
wenzelm@65694
   671
wenzelm@65694
   672
wenzelm@65694
   673
    /* full view on build_log data */
wenzelm@65694
   674
wenzelm@65694
   675
    // WARNING: This may cause performance problems, e.g. with sqlitebrowser
wenzelm@65694
   676
    val full_table: SQL.Table =
    {
      val meta = meta_info_table
      val sessions = sessions_table

      // all meta_info columns, followed by the session columns without their
      // leading log_name and without primary-key status
      val session_columns = sessions.columns.tail.map(c => c.copy(primary_key = false))
      val all_columns = meta.columns ::: session_columns

      // the view joins both tables on log_name, taking log_name from meta_info
      val join_condition = log_name(meta).sql + " = " + log_name(sessions).sql
      val view_query =
        SQL.select(log_name(meta) :: all_columns.tail) +
        SQL.join(meta, sessions, join_condition)

      SQL.Table("isabelle_build_log", all_columns, view = view_query)
    }
wenzelm@65694
   690
wenzelm@65694
   691
wenzelm@65694
   692
    /* earliest pull date for repository version */
wenzelm@65694
   693
wenzelm@65694
   694
    val pull_date = SQL.Column.date("pull_date")
wenzelm@65694
   695
wenzelm@65694
   696
    /* View table "isabelle_build_log_<name>" with columns (version, pull_date):
       for each non-NULL value of the version column in meta_info_table, the
       minimal non-NULL build_start is reported as pull_date. */
    def pull_date_table(name: String, version: SQL.Column): SQL.Table =
      SQL.Table("isabelle_build_log_" + name, List(version.copy(primary_key = true), pull_date),
        view = // PostgreSQL
          "SELECT " + version.sql + ", min(" + Prop.build_start.sql + ") AS " + pull_date.sql +
          " FROM " + meta_info_table.sql +
          // keep "AND" separated from the following identifier by a blank
          " WHERE " + version.sql + " IS NOT NULL AND " + Prop.build_start.sql + " IS NOT NULL" +
          " GROUP BY " + version.sql)
wenzelm@65694
   703
wenzelm@65694
   704
    val isabelle_pull_date_table = pull_date_table("isabelle_pull_date", Prop.isabelle_version)
wenzelm@65694
   705
    val afp_pull_date_table = pull_date_table("afp_pull_date", Prop.afp_version)
wenzelm@65694
   706
wenzelm@65694
   707
    /* Query text selecting all columns of the given table, restricted to rows
       whose pull_date lies within the last "days" days (negative values are
       treated as 0). */
    def recent(table: SQL.Table, days: Int): String =
    {
      val interval = "INTERVAL '" + (days max 0) + " days'"
      val condition = pull_date(table).sql + " > now() - " + interval
      table.sql_select(table.columns) + " WHERE " + condition
    }
wenzelm@65694
   710
wenzelm@65694
   711
    /* Query text selecting the given columns of table, inner-joined on
       isabelle_version with the recent entries of isabelle_pull_date_table. */
    def select_recent(table: SQL.Table, columns: List[SQL.Column], days: Int): String =
    {
      val recent_versions = "(" + recent(isabelle_pull_date_table, days) + ") AS recent"
      val same_version =
        Prop.isabelle_version(table).sql + " = recent." + Prop.isabelle_version.sql
      table.sql_select(columns) + " INNER JOIN " + recent_versions + " ON " + same_version
    }
wenzelm@65694
   715
  }
wenzelm@65694
   716
wenzelm@65694
   717
wenzelm@65694
   718
  /* database access */
wenzelm@65694
   719
wenzelm@65595
   720
  // public factory for Store: the class constructor is private to Build_Log
  def store(options: Options): Store = new Store(options)
wenzelm@65595
   721
wenzelm@65595
   722
  class Store private[Build_Log](options: Options) extends Properties.Store
wenzelm@65595
   723
  {
wenzelm@65595
   724
    /* Open the PostgreSQL build log database, optionally via an SSH session.

       Every parameter defaults to the corresponding "build_log_database_*" or
       "build_log_ssh_*" system option.  An empty ssh_host means that no SSH
       session is opened. */
    def open_database(
      user: String = options.string("build_log_database_user"),
      password: String = options.string("build_log_database_password"),
      database: String = options.string("build_log_database_name"),
      host: String = options.string("build_log_database_host"),
      port: Int = options.int("build_log_database_port"),
      ssh_host: String = options.string("build_log_ssh_host"),
      ssh_user: String = options.string("build_log_ssh_user"),
      ssh_port: Int = options.int("build_log_ssh_port")): PostgreSQL.Database =
    {
      val ssh =
        if (ssh_host == "") None
        else {
          // the SSH session uses ssh_port: "port" is the port of the database server
          Some(SSH.init_context(options).open_session(ssh_host, ssh_user, ssh_port))
        }

      PostgreSQL.open_database(
        user = user, password = password, database = database, host = host, port = port,
        ssh = ssh,
        ssh_close = true)
    }
wenzelm@65599
   741
wenzelm@65694
   742
    /* Store all log files found in dirs into db; for a PostgreSQL database
       the derived views (full table and pull_date tables) are created as well. */
    def update_database(db: SQL.Database, dirs: List[Path], ml_statistics: Boolean = false)
    {
      val log_files = Log_File.find_files(dirs)
      write_info(db, log_files, ml_statistics = ml_statistics)

      db match {
        case _: PostgreSQL.Database =>
          val views =
            List(Data.full_table, Data.isabelle_pull_date_table, Data.afp_pull_date_table)
          for (view <- views) db.create_view(view)
        case _ =>
      }
    }
wenzelm@65694
   751
wenzelm@65694
   752
    /* Write a fresh SQLite database file with the recent rows (last "days"
       days) of the pull_date tables of db.  An existing file is deleted first. */
    def snapshot(db: PostgreSQL.Database, sqlite_database: Path, days: Int = 100)
    {
      Isabelle_System.mkdirs(sqlite_database.dir)
      sqlite_database.file.delete

      using(SQLite.open_database(sqlite_database))(target =>
      {
        // create the table in target and copy its recent rows from db,
        // transferring every column as string
        def copy_recent(table: SQL.Table): Unit =
        {
          target.create_table(table)
          using(target.insert(table))(insert_stmt =>
          {
            using(db.statement(Data.recent(table, days)))(query_stmt =>
            {
              val rows = query_stmt.executeQuery
              while (rows.next()) {
                for ((column, i) <- table.columns.zipWithIndex)
                  target.set_string(insert_stmt, i + 1, db.get(rows, column, db.string _))
                insert_stmt.execute
              }
            })
          })
        }

        db.transaction {
          target.transaction {
            // pull_date tables
            for (table <- List(Data.isabelle_pull_date_table, Data.afp_pull_date_table))
              copy_recent(table)
          }
        }
      })
    }
wenzelm@65694
   782
wenzelm@65688
   783
    /* The set of distinct string values of the given column in table. */
    def domain(db: SQL.Database, table: SQL.Table, column: SQL.Column): Set[String] =
    {
      val select_distinct = db.select(table, List(column), distinct = true)
      using(select_distinct)(stmt =>
      {
        val values = SQL.iterator(stmt.executeQuery)(rs => db.string(rs, column))
        values.toSet
      })
    }
wenzelm@65688
   786
wenzelm@65642
   787
    /* Replace the meta_info row of the given log file: the old row for this
       log name is deleted and a new one is inserted, in one transaction. */
    def update_meta_info(db: SQL.Database, log_file: Log_File)
    {
      val meta_info = log_file.parse_meta_info()
      val table = Data.meta_info_table
      val where_log_name = Data.log_name.sql_where_equal(log_file.name)

      db.transaction {
        using(db.delete(table, where_log_name))(stmt => stmt.execute)
        using(db.insert(table))(stmt =>
        {
          // parameter 1 is log_name, the remaining columns follow from 2
          db.set_string(stmt, 1, log_file.name)
          table.columns.tail.zipWithIndex.foreach({ case (column, k) =>
            val index = k + 2
            column.T match {
              case SQL.Type.Date => db.set_date(stmt, index, meta_info.get_date(column))
              case _ => db.set_string(stmt, index, meta_info.get(column))
            }
          })
          stmt.execute()
        })
      }
    }
wenzelm@65600
   807
wenzelm@65645
   808
    /* Replace the session rows of the given log file: old rows for this log
       name are deleted and one row per session is inserted, in one transaction.
       Parameter positions follow the column order of Data.sessions_table. */
    def update_sessions(db: SQL.Database, log_file: Log_File)
    {
      val sessions = log_file.parse_build_info().sessions
      val table = Data.sessions_table
      val where_log_name = Data.log_name.sql_where_equal(log_file.name)

      db.transaction {
        using(db.delete(table, where_log_name))(stmt => stmt.execute)
        using(db.insert(table))(stmt =>
        {
          // a log without sessions still gets one row, with empty session name
          val rows =
            if (sessions.nonEmpty) sessions.iterator
            else Iterator("" -> Session_Entry.empty)

          rows.foreach({ case (session_name, entry) =>
            val timing = entry.timing
            val ml_timing = entry.ml_timing

            db.set_string(stmt, 1, log_file.name)
            db.set_string(stmt, 2, session_name)
            db.set_string(stmt, 3, entry.proper_chapter)
            db.set_string(stmt, 4, entry.proper_groups)
            db.set_int(stmt, 5, entry.threads)
            db.set_long(stmt, 6, timing.elapsed.proper_ms)
            db.set_long(stmt, 7, timing.cpu.proper_ms)
            db.set_long(stmt, 8, timing.gc.proper_ms)
            db.set_double(stmt, 9, timing.factor)
            db.set_long(stmt, 10, ml_timing.elapsed.proper_ms)
            db.set_long(stmt, 11, ml_timing.cpu.proper_ms)
            db.set_long(stmt, 12, ml_timing.gc.proper_ms)
            db.set_double(stmt, 13, ml_timing.factor)
            db.set_long(stmt, 14, entry.heap_size)
            db.set_string(stmt, 15, entry.status.map(_.toString))
            stmt.execute()
          })
        })
      }
    }
wenzelm@65642
   841
wenzelm@65645
   842
    /* Replace the ml_statistics rows of the given log file: old rows for this
       log name are deleted and the compressed statistics of every session that
       has some are inserted, in one transaction. */
    def update_ml_statistics(db: SQL.Database, log_file: Log_File)
    {
      val build_info = log_file.parse_build_info(ml_statistics = true)
      val table = Data.ml_statistics_table
      val where_log_name = Data.log_name.sql_where_equal(log_file.name)

      db.transaction {
        using(db.delete(table, where_log_name))(stmt => stmt.execute)
        using(db.insert(table))(stmt =>
        {
          def compress(arg: (String, Session_Entry)): (String, Option[Bytes]) =
            (arg._1, compress_properties(arg._2.ml_statistics).proper)

          val with_statistics =
            build_info.sessions.iterator.
              filter({ case (_, entry) => entry.ml_statistics.nonEmpty }).toList
          val compressed: List[(String, Option[Bytes])] =
            Par_List.map[(String, Session_Entry), (String, Option[Bytes])](
              compress _, with_statistics)

          // a log without statistics still gets one row, with empty session name
          val rows: List[(String, Option[Bytes])] =
            if (compressed.isEmpty) List("" -> None) else compressed

          rows.foreach({ case (session_name, ml_statistics) =>
            db.set_string(stmt, 1, log_file.name)
            db.set_string(stmt, 2, session_name)
            db.set_bytes(stmt, 3, ml_statistics)
            stmt.execute()
          })
        })
      }
    }
wenzelm@65645
   865
wenzelm@65645
   866
    /* Store the given log files into the meta_info, sessions and ml_statistics
       tables of db.  Files whose log name is already present in all three
       tables are skipped; the others are parsed and written in groups of 100,
       one transaction per group. */
    def write_info(db: SQL.Database, files: List[JFile], ml_statistics: Boolean = false)
    {
      /* one table together with the log names it is known to contain */
      class Table_Status(table: SQL.Table, update_db: (SQL.Database, Log_File) => Unit)
      {
        db.create_table(table)
        private var stored: Set[String] = domain(db, table, Data.log_name)

        private def is_stored(name: String): Boolean = stored.contains(name)

        def required(file: JFile): Boolean = !is_stored(Log_File.plain_name(file.getName))

        def update(log_file: Log_File): Unit =
          if (!is_stored(log_file.name)) {
            update_db(db, log_file)
            stored = stored + log_file.name
          }
      }

      // without ml_statistics the table is merely marked as up-to-date
      val skip_update: (SQL.Database, Log_File) => Unit = (_, _) => ()
      val ml_statistics_update: (SQL.Database, Log_File) => Unit =
        if (ml_statistics) update_ml_statistics _ else skip_update

      val status =
        List(
          new Table_Status(Data.meta_info_table, update_meta_info _),
          new Table_Status(Data.sessions_table, update_sessions _),
          new Table_Status(Data.ml_statistics_table, ml_statistics_update))

      val pending = files.filter(file => status.exists(_.required(file)))
      pending.grouped(100).foreach(file_group =>
      {
        val log_files = Par_List.map[JFile, Log_File](Log_File.apply _, file_group)
        db.transaction {
          for (log_file <- log_files; table_status <- status)
            table_status.update(log_file)
        }
      })
    }
wenzelm@65605
   895
wenzelm@65621
   896
    /* Read the meta info stored for log_name, or None if there is no such row.
       The first Prop.all_props.length result columns become props, the rest
       settings; NULL values are omitted. */
    def read_meta_info(db: SQL.Database, log_name: String): Option[Meta_Info] =
    {
      val table = Data.meta_info_table
      val columns = table.columns.tail
      val where_log_name = Data.log_name.sql_where_equal(log_name)

      using(db.select(table, columns, where_log_name))(stmt =>
      {
        val rs = stmt.executeQuery
        if (rs.next) {
          // dates are rendered via Log_File.Date_Format, other columns read as string
          def value(column: SQL.Column): Option[String] =
            if (column.T == SQL.Type.Date)
              db.get(rs, column, db.date _).map(date => Log_File.Date_Format(date))
            else db.get(rs, column, db.string _)

          val results = for (column <- columns) yield (column.name, value(column))
          val (prop_results, setting_results) = results.splitAt(Prop.all_props.length)

          val props = prop_results.collect({ case (a, Some(b)) => (a, b) })
          val settings = setting_results.collect({ case (a, Some(b)) => (a, b) })
          Some(Meta_Info(props, settings))
        }
        else None
      })
    }
wenzelm@65621
   918
wenzelm@65621
   919
    /* Read the session entries stored for log_name, excluding the row with
       empty session name.  A non-empty session_names list restricts the result
       to those sessions.  With ml_statistics, the sessions table is
       outer-joined with the ml_statistics table and the statistics are
       uncompressed; otherwise that field is Nil. */
    def read_build_info(
      db: SQL.Database,
      log_name: String,
      session_names: List[String] = Nil,
      ml_statistics: Boolean = false): Build_Info =
    {
      val sessions_table = Data.sessions_table
      val stats_table = Data.ml_statistics_table
      val session_name_sql = Data.session_name(sessions_table).sql

      /* selection condition */

      val base_condition =
        Data.log_name(sessions_table).sql_where_equal(log_name) + " AND " +
          session_name_sql + " <> ''"
      val where =
        if (session_names.nonEmpty) {
          val alternatives =
            session_names.map(name => session_name_sql + " = " + SQL.string(name))
          base_condition + " AND " + alternatives.mkString("(", " OR ", ")")
        }
        else base_condition

      /* columns and source */

      val session_columns = sessions_table.columns.tail.map(column => column(sessions_table))
      val (columns, from) =
        if (!ml_statistics) (session_columns, sessions_table.sql)
        else {
          val join_condition =
            Data.log_name(sessions_table).sql + " = " +
            Data.log_name(stats_table).sql + " AND " +
            session_name_sql + " = " +
            Data.session_name(stats_table).sql
          val join = SQL.join_outer(sessions_table, stats_table, join_condition)
          (session_columns ::: List(Data.ml_statistics(stats_table)), SQL.enclose(join))
        }

      /* result rows */

      val query = SQL.select(columns) + from + " " + where
      val sessions =
        using(db.statement(query))(stmt =>
        {
          val rows =
            SQL.iterator(stmt.executeQuery)(rs =>
            {
              def time(column: SQL.Column): Time = Time.ms(db.long(rs, column))

              val name = db.string(rs, Data.session_name)
              val entry =
                Session_Entry(
                  chapter = db.string(rs, Data.chapter),
                  groups = split_lines(db.string(rs, Data.groups)),
                  threads = db.get(rs, Data.threads, db.int _),
                  timing =
                    Timing(time(Data.timing_elapsed), time(Data.timing_cpu),
                      time(Data.timing_gc)),
                  ml_timing =
                    Timing(time(Data.ml_timing_elapsed), time(Data.ml_timing_cpu),
                      time(Data.ml_timing_gc)),
                  heap_size = db.get(rs, Data.heap_size, db.long _),
                  status =
                    db.get(rs, Data.status, db.string _).
                      map(status_name => Session_Status.withName(status_name)),
                  ml_statistics =
                    if (ml_statistics) uncompress_properties(db.bytes(rs, Data.ml_statistics))
                    else Nil)
              name -> entry
            })
          rows.toMap
        })
      Build_Info(sessions)
    }
wenzelm@65595
   983
  }
wenzelm@64045
   984
}