| author | traytel | 
| Thu, 11 Mar 2021 10:25:04 +0100 | |
| changeset 73408 | be11fe268b33 | 
| parent 73344 | f5c147654661 | 
| child 73712 | 3eba8d4b624b | 
| permissions | -rw-r--r-- | 
| 64160 | 1 | /* Title: Pure/Admin/build_log.scala | 
| 64045 | 2 | Author: Makarius | 
| 3 | ||
| 65608 | 4 | Management of build log files and database storage. | 
| 64045 | 5 | */ | 
| 6 | ||
| 7 | package isabelle | |
| 8 | ||
| 9 | ||
| 64100 | 10 | import java.io.{File => JFile}
 | 
| 64110 | 11 | import java.time.format.{DateTimeFormatter, DateTimeParseException}
 | 
| 64096 | 12 | import java.util.Locale | 
| 64061 
1bbea2b55d22
some support for header and data fields, notably from afp-test;
 wenzelm parents: 
64054diff
changeset | 13 | |
| 65600 | 14 | import scala.collection.immutable.SortedMap | 
| 64054 | 15 | import scala.collection.mutable | 
| 16 | import scala.util.matching.Regex | |
| 17 | ||
| 18 | ||
| 64045 | 19 | object Build_Log | 
| 20 | {
 | |
| 64298 | 21 | /** content **/ | 
| 64101 | 22 | |
| 64298 | 23 | /* properties */ | 
| 64150 | 24 | |
object Prop
{
  /* string-valued build properties, as SQL columns */

  val build_tags = SQL.Column.string("build_tags")  // lines
  val build_args = SQL.Column.string("build_args")  // lines
  val build_group_id = SQL.Column.string("build_group_id")
  val build_id = SQL.Column.string("build_id")
  val build_engine = SQL.Column.string("build_engine")
  val build_host = SQL.Column.string("build_host")
  val isabelle_version = SQL.Column.string("isabelle_version")
  val afp_version = SQL.Column.string("afp_version")

  /* date-valued build properties */

  val build_start = SQL.Column.date("build_start")
  val build_end = SQL.Column.date("build_end")

  /* all property columns, in fixed order */

  val all_props: List[SQL.Column] =
    build_tags :: build_args :: build_group_id :: build_id :: build_engine ::
    build_host :: build_start :: build_end :: isabelle_version :: afp_version :: Nil
}
| 64150 | 42 | |
| 43 | ||
| 64298 | 44 | /* settings */ | 
| 64080 | 45 | |
object Settings
{
  /* settings as SQL columns: the column names are also used as
     variable names for Isabelle_System.getenv in show() */

  val ISABELLE_BUILD_OPTIONS = SQL.Column.string("ISABELLE_BUILD_OPTIONS")
  val ML_PLATFORM = SQL.Column.string("ML_PLATFORM")
  val ML_HOME = SQL.Column.string("ML_HOME")
  val ML_SYSTEM = SQL.Column.string("ML_SYSTEM")
  val ML_OPTIONS = SQL.Column.string("ML_OPTIONS")

  val ml_settings = ML_PLATFORM :: ML_HOME :: ML_SYSTEM :: ML_OPTIONS :: Nil
  val all_settings = ISABELLE_BUILD_OPTIONS :: ml_settings

  type Entry = (String, String)
  type T = List[Entry]

  /* single entry of the form NAME=VALUE */

  object Entry
  {
    // split at the first '=': the value part is passed through Library.perhaps_unquote
    def unapply(s: String): Option[Entry] =
    {
      val i = s.indexOf('=')
      if (i < 0) None
      else Some((s.substring(0, i), Library.perhaps_unquote(s.substring(i + 1))))
    }

    // inverse direction: the value is always quoted
    def apply(a: String, b: String): String = s"$a=${quote(b)}"

    // entry for variable a, with its value taken from Isabelle_System.getenv
    def getenv(a: String): String = apply(a, Isabelle_System.getenv(a))
  }

  /* text for ISABELLE_TOOL_JAVA_OPTIONS and ISABELLE_BUILD_OPTIONS,
     followed by an empty line and all ML settings */

  def show(): String =
  {
    val general =
      List("ISABELLE_TOOL_JAVA_OPTIONS", ISABELLE_BUILD_OPTIONS.name).map(a => Entry.getenv(a))
    val ml = for (c <- ml_settings) yield Entry.getenv(c.name)
    cat_lines(general ::: List("") ::: ml)
  }
}
| 80 | ||
| 81 | ||
| 64298 | 82 | /* file names */ | 
| 83 | ||
// date stamp for log file names: "yyyy-MM-dd" followed by "." and the
// number of seconds since midnight, zero-padded to 5 digits
def log_date(date: Date): String =
{
  val day = DateTimeFormatter.ofPattern("yyyy-MM-dd").format(date.rep)
  val seconds = (date.time - date.midnight.time).ms / 1000
  String.format(Locale.ROOT, "%s.%05d", day, java.lang.Long.valueOf(seconds))
}
| 64298 | 88 | |
// sub-directory "log/YEAR", with the year taken from the given date
def log_subdir(date: Date): Path =
{
  val year = date.rep.getYear.toString
  Path.explode("log") + Path.explode(year)
}
| 91 | ||
// file name of the form ENGINE_DATE[_MORE...].log, with DATE according to log_date
def log_filename(engine: String, date: Date, more: List[String] = Nil): Path =
{
  val parts = engine :: log_date(date) :: more
  Path.explode(parts.mkString("_") + ".log")
}
| 94 | ||
| 95 | ||
| 64100 | 96 | |
| 64062 | 97 | /** log file **/ | 
| 64045 | 98 | |
// print date via the standard log file date format
def print_date(date: Date): String =
  Log_File.Date_Format.apply(date)
| 100 | ||
object Log_File
{
  /* log file */

  // base name without the first matching log / compression suffix
  def plain_name(name: String): String =
  {
    val suffixes = List(".log", ".log.gz", ".log.xz", ".gz", ".xz")
    suffixes.find(sfx => name.endsWith(sfx))
      .map(sfx => Library.try_unsuffix(sfx, name).get)
      .getOrElse(name)
  }

  // from given lines: each line is passed through Library.trim_line
  def apply(name: String, lines: List[String]): Log_File =
    new Log_File(plain_name(name), lines.map(line => Library.trim_line(line)))

  // from plain text: split via Library.trim_split_lines
  def apply(name: String, text: String): Log_File =
    new Log_File(plain_name(name), Library.trim_split_lines(text))

  // from file: ".gz" and ".xz" files are read via the corresponding File operation
  def apply(file: JFile): Log_File =
  {
    val name = file.getName
    val text =
      name match {
        case _ if name.endsWith(".gz") => File.read_gzip(file)
        case _ if name.endsWith(".xz") => File.read_xz(file)
        case _ => File.read(file)
      }
    apply(name, text)
  }

  def apply(path: Path): Log_File = apply(path.file)


  /* log file collections */

  // file name has a known prefix and suffix, and is none of the excluded plain names
  def is_log(file: JFile,
    prefixes: List[String] =
      List(Build_History.log_prefix, Identify.log_prefix, Identify.log_prefix2,
        Isatest.log_prefix, AFP_Test.log_prefix, Jenkins.log_prefix),
    suffixes: List[String] = List(".log", ".log.gz", ".log.xz")): Boolean =
  {
    val name = file.getName
    val excluded = Set("isatest.log", "afp-test.log", "main.log")

    prefixes.exists(prefix => name.startsWith(prefix)) &&
    suffixes.exists(suffix => name.endsWith(suffix)) &&
    !excluded.contains(name)
  }


  /* date format */

  val Date_Format =
  {
    // formats: two patterns with zone in English and German variants,
    // RFC 1123, and a pattern without zone that is given the Berlin timezone
    val zoned_fmts =
      Date.Formatter.variants(
        List("EEE MMM d HH:mm:ss O yyyy", "EEE MMM d HH:mm:ss VV yyyy"),
        List(Locale.ENGLISH, Locale.GERMAN))
    val other_fmts =
      List(
        DateTimeFormatter.RFC_1123_DATE_TIME,
        Date.Formatter.pattern("EEE MMM d HH:mm:ss yyyy").withZone(Date.timezone_berlin))
    val fmts = zoned_fmts ::: other_fmts

    // replacements for certain timezone names
    val timezone_table =
      Map(
        "CET" -> "GMT+1", "MET" -> "GMT+1",
        "CEST" -> "GMT+2", "MEST" -> "GMT+2",
        "EST" -> "Europe/Berlin")

    // replacements for three-letter German weekday names
    val weekday_table =
      Map("Die" -> "Di", "Mit" -> "Mi", "Don" -> "Do", "Fre" -> "Fr", "Sam" -> "Sa", "Son" -> "So")

    def tune_timezone(s: String): String = timezone_table.getOrElse(s, s)
    def tune_weekday(s: String): String = weekday_table.getOrElse(s, s)

    // word-wise adjustment before parsing: weekday replacement for the first word,
    // repair of a broken "Mär" as second word, timezone replacement for all other words
    def tune(s: String): String =
    {
      val words =
        Word.explode(s) match {
          case Nil => Nil
          case day :: rest =>
            val rest1 =
              rest match {
                case "M\uFFFDr" :: more => "Mär" :: more.map(tune_timezone)
                case _ => rest.map(tune_timezone)
              }
            tune_weekday(day) :: rest1
        }
      Word.implode(words)
    }

    Date.Format.make(fmts, tune)
  }
}
| 192 | ||
class Log_File private(val name: String, val lines: List[String])
{
  log_file =>

  override def toString: String = name

  def text: String = cat_lines(lines)

  // error that mentions the name of this log file
  def err(msg: String): Nothing =
    error(s"Error in log file ${quote(name)}: $msg")


  /* date format */

  // total extractor: a date parse failure becomes an error of this log file
  object Strict_Date
  {
    def unapply(s: String): Some[Date] =
    {
      val date =
        try { Log_File.Date_Format.parse(s) }
        catch { case exn: DateTimeParseException => log_file.err(exn.getMessage) }
      Some(date)
    }
  }


  /* inlined text */

  // text of all lines that match the marker
  def filter(Marker: Protocol_Message.Marker): List[String] =
    lines.collect({ case Marker(text) => text })

  // text of the first line that matches the marker
  def find(Marker: Protocol_Message.Marker): Option[String] =
    lines.collectFirst({ case Marker(text) => text })

  // regexes are tried in the given order: the result is the single group of the
  // first line matched by the first regex that matches any line with exactly one group
  def find_match(regexes: List[Regex]): Option[String] =
    regexes.iterator
      .map(regex => lines.collectFirst({ case regex(result) => result }))
      .collectFirst({ case Some(result) => result })


  /* settings */

  // first line that starts with "a=", decomposed as settings entry
  def get_setting(a: String): Option[Settings.Entry] =
  {
    val prefix = a + "="
    lines.find(line => line.startsWith(prefix))
      .flatMap(line => Settings.Entry.unapply(line))
  }

  // entries for all of Settings.all_settings that are present in this log file
  def get_all_settings: Settings.T =
    Settings.all_settings.flatMap(c => get_setting(c.name))


  /* properties (YXML) */

  val cache: XML.Cache = XML.Cache.make()

  // decode YXML text as properties: XML.Error becomes an error of this log file
  def parse_props(text: String): Properties.T =
    try {
      val body = YXML.parse_body(text)
      val props = XML.Decode.properties(body)
      cache.props(props)
    }
    catch { case _: XML.Error => log_file.err("malformed properties") }

  // properties of all marked lines whose text is detected as YXML
  def filter_props(marker: Protocol_Message.Marker): List[Properties.T] =
    filter(marker).collect({ case text if YXML.detect(text) => parse_props(text) })

  // properties of the first marked line, provided its text is detected as YXML
  def find_props(marker: Protocol_Message.Marker): Option[Properties.T] =
    find(marker).filter(text => YXML.detect(text)).map(text => parse_props(text))


  /* parse various formats */

  def parse_meta_info(): Meta_Info =
    Build_Log.parse_meta_info(log_file)

  def parse_build_info(ml_statistics: Boolean = false): Build_Info =
    Build_Log.parse_build_info(log_file, ml_statistics)

  def parse_session_info(
      command_timings: Boolean = false,
      theory_timings: Boolean = false,
      ml_statistics: Boolean = false,
      task_statistics: Boolean = false): Session_Info =
  {
    Build_Log.parse_session_info(
      log_file, command_timings, theory_timings, ml_statistics, task_statistics)
  }
}
| 275 | ||
| 276 | ||
| 64098 | 277 | |
| 65276 | 278 | /** digested meta info: produced by Admin/build_history in log.xz file **/ | 
| 64045 | 279 | |
object Meta_Info
{
  // meta info without any properties or settings
  val empty: Meta_Info = Meta_Info(props = Nil, settings = Nil)
}
| 64098 | 284 | |
sealed case class Meta_Info(props: Properties.T, settings: Settings.T)
{
  def is_empty: Boolean = !(props.nonEmpty || settings.nonEmpty)

  // value for the column name: props take precedence over settings
  def get(c: SQL.Column): Option[String] =
    Properties.get(props, c.name).orElse(Properties.get(settings, c.name))

  // value for the column name, parsed via the log file date format
  def get_date(c: SQL.Column): Option[Date] =
    for (s <- get(c)) yield Log_File.Date_Format.parse(s)
}
| 64061 
1bbea2b55d22
some support for header and data fields, notably from afp-test;
 wenzelm parents: 
64054diff
changeset | 296 | |
object Identify
{
  val log_prefix = "isabelle_identify_"
  val log_prefix2 = "plain_identify_"

  // engine name according to the prefix of the log file name
  def engine(log_file: Log_File): String =
    log_file.name match {
      case name if name.startsWith(Jenkins.log_prefix) => "jenkins_identify"
      case name if name.startsWith(log_prefix2) => "plain_identify"
      case _ => "identify"
    }

  // log file content: start line with date, empty line, optional version lines
  def content(date: Date, isabelle_version: Option[String], afp_version: Option[String]): String =
  {
    val header = List("isabelle_identify: " + Build_Log.print_date(date), "")
    val isabelle = isabelle_version.toList.map(v => "Isabelle version: " + v)
    val afp = afp_version.toList.map(v => "AFP version: " + v)
    terminate_lines(header ::: isabelle ::: afp)
  }

  /* line patterns */

  val Start = """^isabelle_identify: (.+)$""".r
  val No_End = """$.""".r
  val Isabelle_Version = List("""^Isabelle version: (\S+)$""".r)
  val AFP_Version = List("""^AFP version: (\S+)$""".r)
}
| 318 | ||
object Isatest
{
  val log_prefix = "isatest-makeall-"
  val engine = "isatest"

  /* line patterns */

  // two groups; parse_meta_info treats them as start date and host
  val Start = """^------------------- starting test --- (.+) --- (.+)$""".r

  // one group; parse_meta_info treats it as end date
  val End = """^------------------- test (?:successful|FAILED) --- (.+) --- .*$""".r

  val Isabelle_Version = List("""^Isabelle version: (\S+)$""".r)
}
| 327 | ||
object AFP_Test
{
  val log_prefix = "afp-test-devel-"
  val engine = "afp-test"

  /* line patterns */

  // two groups; parse_meta_info treats them as start date and host
  val Start = """^Start test(?: for .+)? at ([^,]+), (.*)$""".r

  // old form with one group only; parse_meta_info treats it as start date
  val Start_Old = """^Start test(?: for .+)? at ([^,]+)$""".r

  val End = """^End test on (.+), .+, elapsed time:.*$""".r

  val Isabelle_Version = List("""^Isabelle version: .* -- hg id (\S+)$""".r)
  val AFP_Version = List("""^AFP version: .* -- hg id (\S+)$""".r)

  val Bad_Init = """^cp:.*: Disc quota exceeded$""".r
}
| 
1bbea2b55d22
some support for header and data fields, notably from afp-test;
 wenzelm parents: 
64054diff
changeset | 339 | |
object Jenkins
{
  val log_prefix = "jenkins_"
  val engine = "jenkins"

  /* line patterns */

  val Host = """^Building remotely on (\S+) \((\S+)\).*$""".r
  val Start = """^(?:Started by an SCM change|Started from command line by admin|).*$""".r
  val Start_Date = """^Build started at (.+)$""".r
  val No_End = """$.""".r

  val Isabelle_Version =
    List(
      """^(?:Build for Isabelle id|Isabelle id) (\w+).*$""".r,
      """^ISABELLE_CI_REPO_ID="(\w+)".*$""".r,
      """^(\w{12}) tip.*$""".r)

  val AFP_Version =
    List(
      """^(?:Build for AFP id|AFP id) (\w+).*$""".r,
      """^ISABELLE_CI_AFP_ID="(\w+)".*$""".r)

  /* section header lines */

  val CONFIGURATION = "=== CONFIGURATION ==="
  val BUILD = "=== BUILD ==="
}
| 358 | ||
private def parse_meta_info(log_file: Log_File): Meta_Info =
{
  /* meta info from engine, host, start date, with patterns for end date and versions */

  def parse(engine: String, host: String, start: Date,
    End: Regex, Isabelle_Version: List[Regex], AFP_Version: List[Regex]): Meta_Info =
  {
    // build id: proper host or proper engine or "build", followed by the start time in ms
    val build_id =
      proper_string(host).orElse(proper_string(engine)).getOrElse("build") + ":" + start.time.ms

    val build_engine = if (engine != "") List(Prop.build_engine.name -> engine) else Nil
    val build_host = if (host != "") List(Prop.build_host.name -> host) else Nil

    val start_date = List(Prop.build_start.name -> print_date(start))

    // end date is only present if the last line matches the End pattern
    val end_date =
      log_file.lines.last match {
        case End(log_file.Strict_Date(date)) => List(Prop.build_end.name -> print_date(date))
        case _ => Nil
      }

    val isabelle_version =
      for (v <- log_file.find_match(Isabelle_Version)) yield Prop.isabelle_version.name -> v
    val afp_version =
      for (v <- log_file.find_match(AFP_Version)) yield Prop.afp_version.name -> v

    val props =
      List(
        List(Prop.build_id.name -> build_id), build_engine, build_host,
        start_date, end_date, isabelle_version.toList, afp_version.toList).flatten

    Meta_Info(props, log_file.get_all_settings)
  }


  /* Jenkins log: start date from the third line of the BUILD section,
     host from the lines before the CONFIGURATION section */

  def parse_jenkins(): Meta_Info =
    log_file.lines.dropWhile(line => line != Jenkins.BUILD) match {
      case Jenkins.BUILD :: _ :: Jenkins.Start_Date(log_file.Strict_Date(start)) :: _ =>
        val header = log_file.lines.takeWhile(line => line != Jenkins.CONFIGURATION)
        val host = header.collectFirst({ case Jenkins.Host(a, b) => a + "." + b }).getOrElse("")
        parse(Jenkins.engine, host, start.to(Date.timezone_berlin), Jenkins.No_End,
          Jenkins.Isabelle_Version, Jenkins.AFP_Version)
      case _ => Meta_Info.empty
    }


  /* detect format from the first lines: the order of cases is significant */

  log_file.lines match {
    case first :: _ if Protocol.Meta_Info_Marker.test_yxml(first) =>
      val props = log_file.find_props(Protocol.Meta_Info_Marker).get
      Meta_Info(props, log_file.get_all_settings)

    case Identify.Start(log_file.Strict_Date(start)) :: _ =>
      parse(Identify.engine(log_file), "", start, Identify.No_End,
        Identify.Isabelle_Version, Identify.AFP_Version)

    case Isatest.Start(log_file.Strict_Date(start), host) :: _ =>
      parse(Isatest.engine, host, start, Isatest.End, Isatest.Isabelle_Version, Nil)

    case AFP_Test.Start(log_file.Strict_Date(start), host) :: _ =>
      parse(AFP_Test.engine, host, start, AFP_Test.End,
        AFP_Test.Isabelle_Version, AFP_Test.AFP_Version)

    case AFP_Test.Start_Old(log_file.Strict_Date(start)) :: _ =>
      parse(AFP_Test.engine, "", start, AFP_Test.End,
        AFP_Test.Isabelle_Version, AFP_Test.AFP_Version)

    // NOTE(review): the Jenkins.Start pattern has an empty alternative followed by ".*",
    // so it looks like it accepts almost any first line and the cases below are
    // rarely reached -- confirm that this is intended
    case Jenkins.Start() :: _ => parse_jenkins()

    case first :: _ if first.startsWith("\u0000") => Meta_Info.empty
    case List(Isatest.End(_)) => Meta_Info.empty
    case _ :: AFP_Test.Bad_Init() :: _ => Meta_Info.empty
    case Nil => Meta_Info.empty

    case _ => log_file.err("cannot detect log file format")
  }
}
| 
1bbea2b55d22
some support for header and data fields, notably from afp-test;
 wenzelm parents: 
64054diff
changeset | 430 | |
| 64085 
1c451e5c145f
clarified parse_build_info: isabelle build output;
 wenzelm parents: 
64083diff
changeset | 431 | |
| 64098 | 432 | |
| 65276 | 433 | /** build info: toplevel output of isabelle build or Admin/build_history **/ | 
| 64119 
8094eaa38d4b
inline session ML statistics into main build log;
 wenzelm parents: 
64117diff
changeset | 434 | |
| 
8094eaa38d4b
inline session ML statistics into main build log;
 wenzelm parents: 
64117diff
// NOTE(review): presumably the property name for session names -- its use is outside this section
val SESSION_NAME: String = "session_name"
| 64085 
1c451e5c145f
clarified parse_build_info: isabelle build output;
 wenzelm parents: 
64083diff
changeset | 436 | |
| 64061 
1bbea2b55d22
some support for header and data fields, notably from afp-test;
 wenzelm parents: 
64054diff
object Session_Status extends Enumeration
{
  // status values, declared in the same order as before (ids 0 to 3)
  val existing = Value
  val finished = Value
  val failed = Value
  val cancelled = Value
}
| 
1bbea2b55d22
some support for header and data fields, notably from afp-test;
 wenzelm parents: 
64054diff
changeset | 441 | |
| 64085 
1c451e5c145f
clarified parse_build_info: isabelle build output;
 wenzelm parents: 
64083diff
sealed case class Session_Entry(
  chapter: String = "",
  groups: List[String] = Nil,
  threads: Option[Int] = None,
  timing: Timing = Timing.zero,
  ml_timing: Timing = Timing.zero,
  sources: Option[String] = None,
  heap_size: Option[Long] = None,
  status: Option[Session_Status.Value] = None,
  errors: List[String] = Nil,
  theory_timings: Map[String, Timing] = Map.empty,
  ml_statistics: List[Properties.T] = Nil)
{
  // groups as lines of text, or None if there are no groups
  def proper_groups: Option[String] =
    if (groups.nonEmpty) Some(cat_lines(groups)) else None

  // status is present and equal to Session_Status.finished
  def finished: Boolean =
    status match {
      case Some(Session_Status.finished) => true
      case _ => false
    }

  // status is present and equal to Session_Status.failed
  def failed: Boolean =
    status match {
      case Some(Session_Status.failed) => true
      case _ => false
    }
}
| 64054 | 459 | |
| 66874 
0b8da0fc9563
store theory timings in session in build_log database;
 wenzelm parents: 
66873diff
object Build_Info
{
  // single entry for the empty session name, with a zero timing for the empty theory name
  val sessions_dummy: Map[String, Session_Entry] =
  {
    val dummy_entry = Session_Entry(theory_timings = Map("" -> Timing.zero))
    Map("" -> dummy_entry)
  }
}
| 
0b8da0fc9563
store theory timings in session in build_log database;
 wenzelm parents: 
66873diff
changeset | 465 | |
| 64085 
1c451e5c145f
clarified parse_build_info: isabelle build output;
 wenzelm parents: 
64083diff
sealed case class Build_Info(sessions: Map[String, Session_Entry])
{
  // names of sessions whose entry is finished
  def finished_sessions: List[String] =
    sessions.toList.collect({ case (name, entry) if entry.finished => name })

  // names of sessions whose entry is failed
  def failed_sessions: List[String] =
    sessions.toList.collect({ case (name, entry) if entry.failed => name })
}
| 471 | ||
// Parse the "isabelle build" output contained in log_file into a Build_Info.
// Every line of the log is matched against the patterns below, and whatever
// is recognized is accumulated per session name.  ML statistics lines are
// only examined when parse_ml_statistics is true.
private def parse_build_info(log_file: Log_File, parse_ml_statistics: Boolean): Build_Info =
{
  // Total extractor: "chapter/name" yields (chapter, name); any other shape
  // yields ("", s), i.e. the whole string as name with empty chapter.
  object Chapter_Name
  {
    def unapply(s: String): Some[(String, String)] =
      space_explode('/', s) match {
        case List(chapter, name) => Some((chapter, name))
        case _ => Some(("", s))
      }
  }

  // line patterns of the build output
  val Session_No_Groups = new Regex("""^Session (\S+)$""")
  val Session_Groups = new Regex("""^Session (\S+) \((.*)\)$""")
  // "Finished" line with elapsed and cpu time (h:m:s each)
  val Session_Finished1 =
    new Regex("""^Finished (\S+) \((\d+):(\d+):(\d+) elapsed time, (\d+):(\d+):(\d+) cpu time.*$""")
  // "Finished" line with elapsed time only; the name must not contain '/'
  val Session_Finished2 =
    new Regex("""^Finished ([^\s/]+) \((\d+):(\d+):(\d+) elapsed time.*$""")
  val Session_Timing =
    new Regex("""^Timing (\S+) \((\d+) threads, (\d+\.\d+)s elapsed time, (\d+\.\d+)s cpu time, (\d+\.\d+)s GC time.*$""")
  val Session_Started = new Regex("""^(?:Running|Building) (\S+) \.\.\.$""")
  // the digest field has exactly SHA1.digest_length non-space characters
  val Sources = new Regex("""^Sources (\S+) (\S{""" + SHA1.digest_length + """})$""")
  val Heap = new Regex("""^Heap (\S+) \((\d+) bytes\)$""")

  // Extractor for a theory timing marker line: yields the session name
  // together with (theory name -> timing).  The properties must start with
  // the SESSION_NAME entry and contain a theory name, otherwise the result
  // is None.
  object Theory_Timing
  {
    def unapply(line: String): Option[(String, (String, Timing))] =
      // NOTE(review): '~' is replaced by '-' before parsing, presumably to
      // turn ML-style negative numbers into a parseable form -- confirm
      Protocol.Theory_Timing_Marker.unapply(line.replace('~', '-')).map(log_file.parse_props)
      match {
        case Some((SESSION_NAME, session) :: props) =>
          for (theory <- Markup.Name.unapply(props))
          yield (session, theory -> Markup.Timing_Properties.parse(props))
        case _ => None
      }
  }

  // accumulated information, each indexed by session name
  var chapter = Map.empty[String, String]
  var groups = Map.empty[String, List[String]]
  var threads = Map.empty[String, Int]
  var timing = Map.empty[String, Timing]
  var ml_timing = Map.empty[String, Timing]
  var started = Set.empty[String]
  var sources = Map.empty[String, String]
  var heap_sizes = Map.empty[String, Long]
  var theory_timings = Map.empty[String, Map[String, Timing]]
  var ml_statistics = Map.empty[String, List[Properties.T]]
  var errors = Map.empty[String, List[String]]

  // Union of all session names seen so far.  Note that errors.keySet is not
  // part of it: a session known only via error messages gets no entry.
  def all_sessions: Set[String] =
    chapter.keySet ++ groups.keySet ++ threads.keySet ++ timing.keySet ++ ml_timing.keySet ++
    started ++ sources.keySet ++ heap_sizes.keySet ++
    theory_timings.keySet ++ ml_statistics.keySet


  for (line <- log_file.lines) {
    line match {
      case Session_No_Groups(Chapter_Name(chapt, name)) =>
        chapter += (name -> chapt)
        groups += (name -> Nil)

      case Session_Groups(Chapter_Name(chapt, name), grps) =>
        chapter += (name -> chapt)
        groups += (name -> Word.explode(grps))

      case Session_Started(name) =>
        started += name

      // Finished1 (with cpu time) is tried before the more permissive Finished2
      case Session_Finished1(name,
          Value.Int(e1), Value.Int(e2), Value.Int(e3),
          Value.Int(c1), Value.Int(c2), Value.Int(c3)) =>
        val elapsed = Time.hms(e1, e2, e3)
        val cpu = Time.hms(c1, c2, c3)
        timing += (name -> Timing(elapsed, cpu, Time.zero))

      case Session_Finished2(name,
          Value.Int(e1), Value.Int(e2), Value.Int(e3)) =>
        val elapsed = Time.hms(e1, e2, e3)
        timing += (name -> Timing(elapsed, Time.zero, Time.zero))

      case Session_Timing(name,
          Value.Int(t), Value.Double(e), Value.Double(c), Value.Double(g)) =>
        val elapsed = Time.seconds(e)
        val cpu = Time.seconds(c)
        val gc = Time.seconds(g)
        ml_timing += (name -> Timing(elapsed, cpu, gc))
        threads += (name -> t)

      case Sources(name, s) =>
        sources += (name -> s)

      case Heap(name, Value.Long(size)) =>
        heap_sizes += (name -> size)

      // marker lines: first test for the marker, then insist on well-formed
      // content; malformed content is reported via log_file.err
      case _ if Protocol.Theory_Timing_Marker.test_yxml(line) =>
        line match {
          case Theory_Timing(name, theory_timing) =>
            theory_timings += (name -> (theory_timings.getOrElse(name, Map.empty) + theory_timing))
          case _ => log_file.err("malformed theory_timing " + quote(line))
        }

      case _ if parse_ml_statistics && Protocol.ML_Statistics_Marker.test_yxml(line) =>
        Protocol.ML_Statistics_Marker.unapply(line).map(log_file.parse_props) match {
          case Some((SESSION_NAME, name) :: props) =>
            // prepended here, reversed when the entry is built
            ml_statistics += (name -> (props :: ml_statistics.getOrElse(name, Nil)))
          case _ => log_file.err("malformed ML_statistics " + quote(line))
        }

      case _ if Protocol.Error_Message_Marker.test_yxml(line) =>
        Protocol.Error_Message_Marker.unapply(line).map(log_file.parse_props) match {
          case Some(List((SESSION_NAME, name), (Markup.CONTENT, msg))) =>
            // prepended here, reversed when the entry is built
            errors += (name -> (msg :: errors.getOrElse(name, Nil)))
          case _ => log_file.err("malformed error message " + quote(line))
        }

      // all other lines are ignored
      case _ =>
    }
  }

  val sessions =
    Map(
      (for (name <- all_sessions.toList) yield {
        // finished: some timing was recorded; failed: started without any
        // timing; existing: merely mentioned in the log
        val status =
          if (timing.isDefinedAt(name) || ml_timing.isDefinedAt(name))
            Session_Status.finished
          else if (started(name)) Session_Status.failed
          else Session_Status.existing
        val entry =
          Session_Entry(
            chapter = chapter.getOrElse(name, ""),
            groups = groups.getOrElse(name, Nil),
            threads = threads.get(name),
            timing = timing.getOrElse(name, Timing.zero),
            ml_timing = ml_timing.getOrElse(name, Timing.zero),
            sources = sources.get(name),
            heap_size = heap_sizes.get(name),
            status = Some(status),
            errors = errors.getOrElse(name, Nil).reverse,
            theory_timings = theory_timings.getOrElse(name, Map.empty),
            ml_statistics = ml_statistics.getOrElse(name, Nil).reverse)
        (name -> entry)
      }):_*)
  Build_Info(sessions)
}
| 64099 | 614 | |
| 615 | ||
| 616 | ||
| 72860 | 617 | /** session info: produced by isabelle build as session database **/ | 
| 64099 | 618 | |
// Properties and error messages extracted from the log of one session.
sealed case class Session_Info(
  session_timing: Properties.T,
  command_timings: List[Properties.T],
  theory_timings: List[Properties.T],
  ml_statistics: List[Properties.T],
  task_statistics: List[Properties.T],
  errors: List[String])
{
  // copy of this info with message s added after the existing errors
  def error(s: String): Session_Info = copy(errors = errors :+ s)
}
| 64099 | 630 | |
// Collect the marked properties of a session log into a Session_Info.
// Each Boolean flag decides whether the corresponding category is extracted
// at all (otherwise it stays empty); session timing and error messages are
// always extracted.
private def parse_session_info(
  log_file: Log_File,
  command_timings: Boolean,
  theory_timings: Boolean,
  ml_statistics: Boolean,
  task_statistics: Boolean): Session_Info =
{
  val session_timing_props: Properties.T =
    log_file.find_props(Protocol.Session_Timing_Marker).getOrElse(Nil)

  val command_timing_props: List[Properties.T] =
    if (!command_timings) Nil
    else log_file.filter_props(Protocol.Command_Timing_Marker)

  val theory_timing_props: List[Properties.T] =
    if (!theory_timings) Nil
    else log_file.filter_props(Protocol.Theory_Timing_Marker)

  val ml_statistics_props: List[Properties.T] =
    if (!ml_statistics) Nil
    else log_file.filter_props(Protocol.ML_Statistics_Marker)

  val task_statistics_props: List[Properties.T] =
    if (!task_statistics) Nil
    else log_file.filter_props(Protocol.Task_Statistics_Marker)

  val error_messages: List[String] = log_file.filter(Protocol.Error_Message_Marker)

  Session_Info(
    session_timing = session_timing_props,
    command_timings = command_timing_props,
    theory_timings = theory_timing_props,
    ml_statistics = ml_statistics_props,
    task_statistics = task_statistics_props,
    errors = error_messages)
}
| 65595 | 650 | |
// Encode a list of error messages as YXML text and compress it; an empty
// list is represented by None.
def compress_errors(errors: List[String], cache: XZ.Cache = XZ.Cache()): Option[Bytes] =
  errors match {
    case Nil => None
    case _ =>
      val body = XML.Encode.list(XML.Encode.string)(errors)
      val text = YXML.string_of_body(body)
      Some(Bytes(text).compress(cache = cache))
  }
| 65937 | 657 | |
// Inverse of compress_errors: uncompress, parse the YXML text and decode the
// list of messages; empty bytes stand for the empty list.
def uncompress_errors(bytes: Bytes, cache: XML.Cache = XML.Cache.make()): List[String] =
{
  if (!bytes.is_empty) {
    val text = bytes.uncompress(cache = cache.xz).text
    val body = YXML.parse_body(text, cache = cache)
    XML.Decode.list(YXML.string_of_body)(body)
  }
  else Nil
}
| 65937 | 664 | |
| 65595 | 665 | |
| 666 | ||
| 667 | /** persistent store **/ | |
| 668 | ||
| 65694 | 669 | /* SQL data model */ | 
| 670 | ||
| 671 | object Data | |
| 672 |   {
 | |
// Table descriptor whose name is prefixed with "isabelle_build_log_".
def build_log_table(name: String, columns: List[SQL.Column], body: String = ""): SQL.Table =
{
  val table_name = "isabelle_build_log_" + name
  SQL.Table(table_name, columns, body)
}
| 675 | ||
| 676 | ||
| 65694 | 677 | /* main content */ | 
| 678 | ||
// Column descriptors used by the tables defined below.

// key columns: each one is declared as primary key
val log_name = SQL.Column.string("log_name").make_primary_key
val session_name = SQL.Column.string("session_name").make_primary_key
val theory_name = SQL.Column.string("theory_name").make_primary_key

// session attributes
val chapter = SQL.Column.string("chapter")
val groups = SQL.Column.string("groups")
val threads = SQL.Column.int("threads")

// session timing
val timing_elapsed = SQL.Column.long("timing_elapsed")
val timing_cpu = SQL.Column.long("timing_cpu")
val timing_gc = SQL.Column.long("timing_gc")
val timing_factor = SQL.Column.double("timing_factor")

// session ML timing
val ml_timing_elapsed = SQL.Column.long("ml_timing_elapsed")
val ml_timing_cpu = SQL.Column.long("ml_timing_cpu")
val ml_timing_gc = SQL.Column.long("ml_timing_gc")
val ml_timing_factor = SQL.Column.double("ml_timing_factor")

// timing of individual theories
val theory_timing_elapsed = SQL.Column.long("theory_timing_elapsed")
val theory_timing_cpu = SQL.Column.long("theory_timing_cpu")
val theory_timing_gc = SQL.Column.long("theory_timing_gc")

// further session data; errors and ml_statistics are stored as bytes
val heap_size = SQL.Column.long("heap_size")
val status = SQL.Column.string("status")
val errors = SQL.Column.bytes("errors")
val sources = SQL.Column.string("sources")
val ml_statistics = SQL.Column.bytes("ml_statistics")

// Boolean column; select_recent_versions uses a copy of it with a computed
// expression
val known = SQL.Column.bool("known")
| 65694 | 702 | |
// per log file: log name followed by all properties and settings
val meta_info_table: SQL.Table =
  build_log_table("meta_info", log_name :: Prop.all_props ::: Settings.all_settings)

// per session of a log file: attributes, timing, status, errors, sources
val sessions_table: SQL.Table =
  build_log_table("sessions",
    List(
      log_name, session_name,
      chapter, groups, threads,
      timing_elapsed, timing_cpu, timing_gc, timing_factor,
      ml_timing_elapsed, ml_timing_cpu, ml_timing_gc, ml_timing_factor,
      heap_size, status, errors, sources))

// per theory of a session: timing
val theories_table: SQL.Table =
  build_log_table("theories",
    List(
      log_name, session_name, theory_name,
      theory_timing_elapsed, theory_timing_cpu, theory_timing_gc))

// per session of a log file: ML statistics
val ml_statistics_table: SQL.Table =
  build_log_table("ml_statistics", List(log_name, session_name, ml_statistics))
| 65694 | 719 | |
| 720 | ||
| 66855 | 721 | /* AFP versions */ | 
| 722 | ||
// Distinct pairs of Isabelle version and AFP version from meta_info_table,
// restricted to rows where both versions are defined.
val isabelle_afp_versions_table: SQL.Table =
{
  val isabelle = Prop.isabelle_version
  val afp = Prop.afp_version

  val query =
    SQL.select(List(isabelle, afp), distinct = true) + meta_info_table +
    " WHERE " + isabelle.defined + " AND " + afp.defined

  build_log_table("isabelle_afp_versions", List(isabelle.make_primary_key, afp), query)
}
| 731 | ||
| 732 | ||
| 65705 | 733 | /* earliest pull date for repository version (PostgreSQL queries) */ | 
| 65694 | 734 | |
// Date column for the pull date: "afp_pull_date" if afp, else "pull_date".
def pull_date(afp: Boolean = false): SQL.Column =
{
  val column_name = if (afp) "afp_pull_date" else "pull_date"
  SQL.Column.date(column_name)
}
| 65694 | 738 | |
// Table of the earliest build_start per repository version, taken from
// meta_info_table.  With afp the version consists of both isabelle_version
// and afp_version, otherwise of isabelle_version alone.
def pull_date_table(afp: Boolean = false): SQL.Table =
{
  val name = if (afp) "afp_pull_date" else "pull_date"
  val versions =
    if (afp) List(Prop.isabelle_version, Prop.afp_version)
    else List(Prop.isabelle_version)

  val date = pull_date(afp)
  val columns = versions.map(_.make_primary_key) ::: List(date)

  val version_names = versions.mkString(", ")
  val all_defined = (versions ::: List(Prop.build_start)).map(_.defined).mkString(" AND ")

  build_log_table(name, columns,
    "SELECT " + version_names + ", min(" + Prop.build_start + ") AS " + date +
    " FROM " + meta_info_table +
    " WHERE " + all_defined +
    " GROUP BY " + version_names)
}
| 752 | ||
| 753 | ||
| 754 | /* recent entries */ | |
| 755 | ||
// SQL expression for the point in time the given number of days before now;
// negative values count as 0.
def recent_time(days: Int): SQL.Source =
{
  val n = math.max(days, 0)
  "now() - INTERVAL '" + n + " days'"
}
| 758 | ||
// Restriction of the pull date table to entries more recent than the given
// number of days, optionally extended by the entry for explicitly given
// revisions: rev for isabelle_version, afp_rev for afp_version.  A defined
// afp_rev also selects the AFP variant of the pull date table.
def recent_pull_date_table(
  days: Int, rev: String = "", afp_rev: Option[String] = None): SQL.Table =
{
  val afp = afp_rev.isDefined
  val rev2 = afp_rev.getOrElse("")
  val table = pull_date_table(afp)

  val eq1 = Prop.isabelle_version(table).toString + " = " + SQL.string(rev)
  val eq2 = Prop.afp_version(table).toString + " = " + SQL.string(rev2)

  // extra alternative for the explicitly requested revisions, if any
  val explicit_revs =
    (rev != "", rev2 != "") match {
      case (true, false) => " OR " + eq1
      case (false, true) => " OR " + eq2
      case (true, true) => " OR (" + eq1 + " AND " + eq2 + ")"
      case (false, false) => ""
    }

  val condition =
    "WHERE " + pull_date(afp)(table) + " > " + recent_time(days) + explicit_revs

  SQL.Table("recent_pull_date", table.columns, table.select(table.columns, condition))
}
| 65694 | 779 | |
// Query for the distinct log names of meta_info_table whose isabelle_version
// occurs in the recent pull date table for the given number of days.
def select_recent_log_names(days: Int): SQL.Source =
{
  val meta_info = meta_info_table
  val recent = recent_pull_date_table(days)

  val selection = meta_info.select(List(log_name), distinct = true)
  val same_version =
    " ON " + Prop.isabelle_version(meta_info) + " = " + Prop.isabelle_version(recent)

  selection + SQL.join_inner + recent.query_named + same_version
}
| 787 | ||
// Query for the recent repository versions, newest pull date first.  Each
// row carries the columns of the recent pull date table plus the column
// "known", which tells whether an outer join with the auxiliary selection
// from meta_info_table (restricted by sql) found a log for that
// isabelle_version.
def select_recent_versions(days: Int,
  rev: String = "", afp_rev: Option[String] = None, sql: SQL.Source = ""): SQL.Source =
{
  val afp = afp_rev.isDefined
  val recent = recent_pull_date_table(days, rev = rev, afp_rev = afp_rev)
  val meta_info = meta_info_table
  val aux_table = SQL.Table("aux", meta_info.columns, meta_info.select(sql = sql))

  val recent_columns = recent.columns.map(_.apply(recent))
  val known_column = known.copy(expr = log_name(aux_table).defined)
  val columns = recent_columns ::: List(known_column)

  val version = Prop.isabelle_version
  SQL.select(columns, distinct = true) +
    recent.query_named + SQL.join_outer + aux_table.query_named +
    " ON " + version(recent) + " = " + version(aux_table) +
    " ORDER BY " + pull_date(afp)(recent) + " DESC"
}
| 
d3d5cb2d6866
pick isabelle_version based on build_log database;
 wenzelm parents: 
65781diff
changeset | 805 | |
| 65724 | 806 | |
| 807 | /* universal view on main data */ | |
| 808 | ||
/* Combined table "isabelle_build_log", assembled stepwise from named
   sub-queries:
     a = meta_info + afp_pull_date (outer join on both repository versions)
     b = a + pull_date (outer join on isabelle_version)
     c = b + sessions (inner join on log_name)
   and finally c + ml_statistics (outer join on log_name and session_name). */
val universal_table: SQL.Table =
{
  val isabelle_version = Prop.isabelle_version
  val afp_version = Prop.afp_version
  val afp_date = pull_date(afp = true)

  val meta_info = meta_info_table
  val afp_dates = pull_date_table(afp = true)
  val isabelle_dates = pull_date_table()

  // a: log_name, afp_pull_date, remaining meta_info columns
  val meta_info_tail = meta_info.columns.tail
  val a_columns = log_name :: afp_date :: meta_info_tail
  val a_select =
    SQL.select(List(log_name, afp_date) ::: meta_info_tail.map(_.apply(meta_info)))
  val a_table =
    SQL.Table("a", a_columns,
      a_select + meta_info + SQL.join_outer + afp_dates +
      " ON " + isabelle_version(meta_info) + " = " + isabelle_version(afp_dates) +
      " AND " + afp_version(meta_info) + " = " + afp_version(afp_dates))

  // b: log_name, pull_date, remaining columns of a
  val a_tail = a_columns.tail
  val b_columns = log_name :: pull_date() :: a_tail
  val b_select =
    SQL.select(
      List(log_name(a_table), pull_date()(isabelle_dates)) ::: a_tail.map(_.apply(a_table)))
  val b_table =
    SQL.Table("b", b_columns,
      b_select + a_table.query_named + SQL.join_outer + isabelle_dates +
      " ON " + isabelle_version(a_table) + " = " + isabelle_version(isabelle_dates))

  // c: columns of b, followed by the session columns (without their log_name)
  val c_columns = b_columns ::: sessions_table.columns.tail
  val c_select = SQL.select(log_name(b_table) :: c_columns.tail)
  val c_table =
    SQL.Table("c", c_columns,
      c_select + b_table.query_named + SQL.join_inner + sessions_table +
      " ON " + log_name(b_table) + " = " + log_name(sessions_table))

  // result: columns of c, followed by ml_statistics
  val result_select = SQL.select(c_columns.map(_.apply(c_table)) ::: List(ml_statistics))
  SQL.Table("isabelle_build_log", c_columns ::: List(ml_statistics),
    result_select + c_table.query_named + SQL.join_outer + ml_statistics_table +
    " ON " + log_name(c_table) + " = " + log_name(ml_statistics_table) +
    " AND " + session_name(c_table) + " = " + session_name(ml_statistics_table))
}
| 65694 | 849 | } | 
| 850 | ||
| 851 | ||
| 852 | /* database access */ | |
| 853 | ||
/* Make a Store for the given options; the XML cache defaults to a fresh
   XML.Cache.make(). */
def store(options: Options, cache: XML.Cache = XML.Cache.make()): Store =
{
  new Store(options = options, cache = cache)
}
| 65595 | 856 | |
| 73031 
f93f0597f4fb
clarified signature: absorb XZ.Cache into XML.Cache;
 wenzelm parents: 
73025diff
changeset | 857 | class Store private[Build_Log](options: Options, val cache: XML.Cache) | 
| 65595 | 858 |   {
 | 
/* Open the PostgreSQL build_log database; all connection parameters default
   to the corresponding "build_log_*" system options.  An SSH session is
   opened only for a non-empty ssh_host, and is passed with ssh_close = true. */
def open_database(
  user: String = options.string("build_log_database_user"),
  password: String = options.string("build_log_database_password"),
  database: String = options.string("build_log_database_name"),
  host: String = options.string("build_log_database_host"),
  port: Int = options.int("build_log_database_port"),
  ssh_host: String = options.string("build_log_ssh_host"),
  ssh_user: String = options.string("build_log_ssh_user"),
  ssh_port: Int = options.int("build_log_ssh_port")): PostgreSQL.Database =
{
  val ssh_session =
    ssh_host match {
      case "" => None
      case _ => Some(SSH.open_session(options, host = ssh_host, user = ssh_user, port = ssh_port))
    }

  PostgreSQL.open_database(
    user = user,
    password = password,
    database = database,
    host = host,
    port = port,
    ssh = ssh_session,
    ssh_close = true)
}
| 65599 | 876 | |
/* Write all log files found below the given directories (following links)
   into the database, then create the pull_date, afp_pull_date and universal
   views. */
def update_database(
  db: PostgreSQL.Database, dirs: List[Path], ml_statistics: Boolean = false): Unit =
{
  val log_files =
    for {
      dir <- dirs
      file <- File.find_files(dir.file, pred = Log_File.is_log(_), follow_links = true)
    } yield file
  write_info(db, log_files, ml_statistics = ml_statistics)

  val views =
    List(Data.pull_date_table(), Data.pull_date_table(afp = true), Data.universal_table)
  for (view <- views) db.create_view(view)
}
| 889 | ||
/* Produce a fresh SQLite snapshot of the PostgreSQL database: any existing
   snapshot file is deleted first.  Content is restricted to the log names
   selected by Data.select_recent_log_names(days) and the pull dates from
   Data.recent_pull_date_table(days); ml_statistics are copied only on
   request. */
def snapshot_database(db: PostgreSQL.Database, sqlite_database: Path,
  days: Int = 100, ml_statistics: Boolean = false): Unit =
{
  Isabelle_System.make_directory(sqlite_database.dir)
  sqlite_database.file.delete

  using(SQLite.open_database(sqlite_database))(snapshot =>
  {
    // copy meta info, sessions and (optionally) ml_statistics of one log file
    def copy_log(name: String): Unit =
    {
      for (meta_info <- read_meta_info(db, name)) {
        update_meta_info(snapshot, name, meta_info)
      }
      update_sessions(snapshot, name, read_build_info(db, name))
      if (ml_statistics) {
        update_ml_statistics(snapshot, name, read_build_info(db, name, ml_statistics = true))
      }
    }

    // create and fill the (afp_)pull_date table; all values are transferred as strings
    def copy_pull_dates(afp: Boolean): Unit =
    {
      val afp_rev = if (afp) Some("") else None
      val table = Data.pull_date_table(afp)
      snapshot.create_table(table)
      snapshot.using_statement(table.insert())(insert =>
      {
        db.using_statement(
          Data.recent_pull_date_table(days, afp_rev = afp_rev).query)(stmt =>
        {
          val res = stmt.execute_query()
          while (res.next()) {
            table.columns.zipWithIndex.foreach({ case (column, i) =>
              insert.string(i + 1) = res.get_string(column)
            })
            insert.execute()
          }
        })
      })
    }

    db.transaction {
      snapshot.transaction {
        // main content
        val main_tables =
          List(Data.meta_info_table, Data.sessions_table, Data.theories_table,
            Data.ml_statistics_table)
        for (table <- main_tables) snapshot.create_table(table)

        val recent_log_names =
          db.using_statement(Data.select_recent_log_names(days))(stmt =>
            stmt.execute_query().iterator(_.string(Data.log_name)).toList)
        recent_log_names.foreach(copy_log)

        // pull_date
        List(false, true).foreach(copy_pull_dates)

        // full view
        snapshot.create_view(Data.universal_table)
      }
    }
    snapshot.rebuild
  })
}
| 951 | ||
/* The set of distinct values of the given column within the table, read as
   strings. */
def domain(db: SQL.Database, table: SQL.Table, column: SQL.Column): Set[String] =
{
  val query = table.select(List(column), distinct = true)
  db.using_statement(query)(stmt =>
  {
    val values = stmt.execute_query().iterator(res => res.string(column))
    values.toSet
  })
}
| 65688 | 955 | |
/* Insert (permissively) one row into the meta_info table: log_name as first
   parameter, followed by the remaining columns taken from meta_info. */
def update_meta_info(db: SQL.Database, log_name: String, meta_info: Meta_Info): Unit =
{
  val table = Data.meta_info_table
  val value_columns = table.columns.tail
  db.using_statement(db.insert_permissive(table))(stmt =>
  {
    stmt.string(1) = log_name
    value_columns.zipWithIndex.foreach({ case (column, i) =>
      // statement parameters count from 1, and parameter 1 is log_name
      val index = i + 2
      if (column.T == SQL.Type.Date) {
        stmt.date(index) = meta_info.get_date(column)
      }
      else {
        stmt.string(index) = meta_info.get(column)
      }
    })
    stmt.execute()
  })
}
| 971 | ||
/* Insert (permissively) one row per session into the sessions table; a
   build_info without sessions falls back on Build_Info.sessions_dummy. */
def update_sessions(db: SQL.Database, log_name: String, build_info: Build_Info): Unit =
{
  val table = Data.sessions_table
  db.using_statement(db.insert_permissive(table))(stmt =>
  {
    val entries =
      if (build_info.sessions.nonEmpty) build_info.sessions
      else Build_Info.sessions_dummy

    entries.foreach({ case (session_name, session) =>
      val timing = session.timing
      val ml_timing = session.ml_timing

      stmt.string(1) = log_name
      stmt.string(2) = session_name
      stmt.string(3) = proper_string(session.chapter)
      stmt.string(4) = session.proper_groups
      stmt.int(5) = session.threads
      stmt.long(6) = timing.elapsed.proper_ms
      stmt.long(7) = timing.cpu.proper_ms
      stmt.long(8) = timing.gc.proper_ms
      stmt.double(9) = timing.factor
      stmt.long(10) = ml_timing.elapsed.proper_ms
      stmt.long(11) = ml_timing.cpu.proper_ms
      stmt.long(12) = ml_timing.gc.proper_ms
      stmt.double(13) = ml_timing.factor
      stmt.long(14) = session.heap_size
      stmt.string(15) = session.status.map(_.toString)
      stmt.bytes(16) = compress_errors(session.errors, cache = cache.xz)
      stmt.string(17) = session.sources
      stmt.execute()
    })
  })
}
| 1002 | ||
/* Insert (permissively) one row per theory timing into the theories table;
   when no session has any theory timings, the entries of
   Build_Info.sessions_dummy are used instead. */
def update_theories(db: SQL.Database, log_name: String, build_info: Build_Info): Unit =
{
  val table = Data.theories_table
  db.using_statement(db.insert_permissive(table))(stmt =>
  {
    val has_timings =
      build_info.sessions.exists({ case (_, session) => session.theory_timings.nonEmpty })
    val entries =
      if (has_timings) build_info.sessions
      else Build_Info.sessions_dummy

    entries.foreach({ case (session_name, session) =>
      session.theory_timings.foreach({ case (theory_name, timing) =>
        stmt.string(1) = log_name
        stmt.string(2) = session_name
        stmt.string(3) = theory_name
        stmt.long(4) = timing.elapsed.ms
        stmt.long(5) = timing.cpu.ms
        stmt.long(6) = timing.gc.ms
        stmt.execute()
      })
    })
  })
}
| 
0b8da0fc9563
store theory timings in session in build_log database;
 wenzelm parents: 
66873diff
changeset | 1026 | |
/* Insert (permissively) the compressed ml_statistics of all sessions that
   have any; otherwise a single row with empty session name and no data is
   written.  Compression is performed via Par_List.map. */
def update_ml_statistics(db: SQL.Database, log_name: String, build_info: Build_Info): Unit =
{
  def compress_entry(entry: (String, Session_Entry)): (String, Option[Bytes]) =
    (entry._1, Properties.compress(entry._2.ml_statistics, cache = cache.xz).proper)

  val table = Data.ml_statistics_table
  db.using_statement(db.insert_permissive(table))(stmt =>
  {
    val sessions_with_stats =
      build_info.sessions.toList.filter({ case (_, session) => session.ml_statistics.nonEmpty })
    val compressed =
      Par_List.map[(String, Session_Entry), (String, Option[Bytes])](
        compress_entry, sessions_with_stats)
    val entries: List[(String, Option[Bytes])] =
      if (compressed.isEmpty) List("" -> None) else compressed

    entries.foreach({ case (session_name, ml_statistics) =>
      stmt.string(1) = log_name
      stmt.string(2) = session_name
      stmt.bytes(3) = ml_statistics
      stmt.execute()
    })
  })
}
| 
2c704ae04db1
clarified database layout: bulky ml_statistics are stored/retrieved separately;
 wenzelm parents: 
65643diff
changeset | 1045 | |
/* Write the content of the given log files into the database tables
   meta_info, sessions, theories, ml_statistics.  Only files whose log name
   is missing from at least one table are parsed; they are processed in
   groups of "build_log_transaction_size" (at least 1), one transaction per
   group. */
def write_info(db: SQL.Database, files: List[JFile], ml_statistics: Boolean = false): Unit =
{
  /* Status of one table: the table is created on construction, and the log
     names it already contains are tracked in "known". */
  class Table_Status(table: SQL.Table, update_db: Log_File => Unit)
  {
    db.create_table(table)
    private var known: Set[String] = domain(db, table, Data.log_name)

    def required(file: JFile): Boolean =
      !known.contains(Log_File.plain_name(file.getName))

    def update(log_file: Log_File): Unit =
      if (!known.contains(log_file.name)) {
        update_db(log_file)
        known += log_file.name
      }
  }

  val status =
    List(
      new Table_Status(Data.meta_info_table,
        log_file => update_meta_info(db, log_file.name, log_file.parse_meta_info())),
      new Table_Status(Data.sessions_table,
        log_file => update_sessions(db, log_file.name, log_file.parse_build_info())),
      new Table_Status(Data.theories_table,
        log_file => update_theories(db, log_file.name, log_file.parse_build_info())),
      // without ml_statistics nothing is written, but the log still counts as updated
      new Table_Status(Data.ml_statistics_table,
        log_file =>
          if (ml_statistics) {
            update_ml_statistics(db, log_file.name,
              log_file.parse_build_info(ml_statistics = true))
          }))

  val required_files = files.filter(file => status.exists(_.required(file)))
  val transaction_size = options.int("build_log_transaction_size") max 1

  required_files.grouped(transaction_size).foreach(file_group =>
  {
    val log_files = Par_List.map[JFile, Log_File](Log_File.apply, file_group)
    db.transaction {
      for (log_file <- log_files; table_status <- status) table_status.update(log_file)
    }
  })
}
| 1094 | ||
/* Read the meta_info row for the given log name, if present.  Date columns
   are rendered via Log_File.Date_Format; undefined values are dropped.  The
   first Prop.all_props.length columns become props, the rest settings. */
def read_meta_info(db: SQL.Database, log_name: String): Option[Meta_Info] =
{
  val table = Data.meta_info_table
  val columns = table.columns.tail
  val query = table.select(columns, Data.log_name.where_equal(log_name))
  db.using_statement(query)(stmt =>
  {
    val res = stmt.execute_query()
    if (res.next()) {
      val results =
        columns.map(column =>
        {
          val value =
            if (column.T == SQL.Type.Date) res.get_date(column).map(Log_File.Date_Format(_))
            else res.get_string(column)
          column.name -> value
        })
      val (prop_results, setting_results) = results.splitAt(Prop.all_props.length)
      val props = prop_results.collect({ case (name, Some(value)) => (name, value) })
      val settings = setting_results.collect({ case (name, Some(value)) => (name, value) })
      Some(Meta_Info(props, settings))
    }
    else None
  })
}
| 1117 | ||
/* Read the session entries of the given log file, skipping rows with empty
   session name, optionally restricted to session_names.  With ml_statistics
   enabled, the sessions table is outer-joined with the ml_statistics table
   and the statistics are uncompressed; otherwise they are Nil. */
def read_build_info(
  db: SQL.Database,
  log_name: String,
  session_names: List[String] = Nil,
  ml_statistics: Boolean = false): Build_Info =
{
  val sessions_table = Data.sessions_table
  val ml_table = Data.ml_statistics_table

  val session_filter =
    if (session_names.isEmpty) ""
    else " AND " + SQL.member(Data.session_name(sessions_table).ident, session_names)
  val where =
    Data.log_name(sessions_table).where_equal(log_name) + " AND " +
    Data.session_name(sessions_table) + " <> ''" + session_filter

  val session_columns = sessions_table.columns.tail.map(_.apply(sessions_table))
  val (columns, from) =
    if (!ml_statistics) (session_columns, sessions_table.ident)
    else {
      val join =
        sessions_table.toString + SQL.join_outer + ml_table + " ON " +
        Data.log_name(sessions_table) + " = " + Data.log_name(ml_table) + " AND " +
        Data.session_name(sessions_table) + " = " + Data.session_name(ml_table)
      (session_columns ::: List(Data.ml_statistics(ml_table)), SQL.enclose(join))
    }

  val entries =
    db.using_statement(SQL.select(columns) + from + " " + where)(stmt =>
    {
      val rows =
        stmt.execute_query().iterator(res =>
        {
          val name = res.string(Data.session_name)
          val entry =
            Session_Entry(
              chapter = res.string(Data.chapter),
              groups = split_lines(res.string(Data.groups)),
              threads = res.get_int(Data.threads),
              timing = res.timing(Data.timing_elapsed, Data.timing_cpu, Data.timing_gc),
              ml_timing =
                res.timing(Data.ml_timing_elapsed, Data.ml_timing_cpu, Data.ml_timing_gc),
              sources = res.get_string(Data.sources),
              heap_size = res.get_long(Data.heap_size),
              status = res.get_string(Data.status).map(Session_Status.withName),
              errors = uncompress_errors(res.bytes(Data.errors), cache = cache),
              ml_statistics =
                if (ml_statistics) {
                  Properties.uncompress(res.bytes(Data.ml_statistics), cache = cache)
                }
                else Nil)
          name -> entry
        })
      // materialize within the scope of the statement
      rows.toMap
    })
  Build_Info(entries)
}
| 65595 | 1174 | } | 
| 64045 | 1175 | } |