author | wenzelm |
Wed, 29 Mar 2023 14:22:01 +0200 | |
changeset 77744 | 1398add8c414 |
parent 77679 | e92000492895 |
child 77745 | ebf70b199db7 |
permissions | -rw-r--r-- |
64160 | 1 |
/* Title: Pure/Admin/build_log.scala |
64045 | 2 |
Author: Makarius |
3 |
||
65608 | 4 |
Management of build log files and database storage. |
64045 | 5 |
*/ |
6 |
||
7 |
package isabelle |
|
8 |
||
9 |
||
64100 | 10 |
import java.io.{File => JFile} |
64110 | 11 |
import java.time.format.{DateTimeFormatter, DateTimeParseException} |
64096 | 12 |
import java.util.Locale |
64061
1bbea2b55d22
some support for header and data fields, notably from afp-test;
wenzelm
parents:
64054
diff
changeset
|
13 |
|
65600 | 14 |
import scala.collection.immutable.SortedMap |
64054 | 15 |
import scala.collection.mutable |
16 |
import scala.util.matching.Regex |
|
17 |
||
18 |
||
75393 | 19 |
object Build_Log { |
64298 | 20 |
/** content **/ |
64101 | 21 |
|
64298 | 22 |
/* properties */ |
64150 | 23 |
|
75393 | 24 |
object Prop {
  // multi-line values ("lines")
  val build_tags = SQL.Column.string("build_tags")
  val build_args = SQL.Column.string("build_args")

  // build identification
  val build_group_id = SQL.Column.string("build_group_id")
  val build_id = SQL.Column.string("build_id")
  val build_engine = SQL.Column.string("build_engine")
  val build_host = SQL.Column.string("build_host")

  // build time span
  val build_start = SQL.Column.date("build_start")
  val build_end = SQL.Column.date("build_end")

  // repository versions
  val isabelle_version = SQL.Column.string("isabelle_version")
  val afp_version = SQL.Column.string("afp_version")

  // all property columns, in declaration order
  val all_props: List[SQL.Column] =
    List(
      build_tags,
      build_args,
      build_group_id,
      build_id,
      build_engine,
      build_host,
      build_start,
      build_end,
      isabelle_version,
      afp_version)
}
64150 | 40 |
|
41 |
||
64298 | 42 |
/* settings */ |
64080 | 43 |
|
75393 | 44 |
object Settings {
  /* columns */

  val ISABELLE_BUILD_OPTIONS = SQL.Column.string("ISABELLE_BUILD_OPTIONS")
  val ML_PLATFORM = SQL.Column.string("ML_PLATFORM")
  val ML_HOME = SQL.Column.string("ML_HOME")
  val ML_SYSTEM = SQL.Column.string("ML_SYSTEM")
  val ML_OPTIONS = SQL.Column.string("ML_OPTIONS")

  val ml_settings = List(ML_PLATFORM, ML_HOME, ML_SYSTEM, ML_OPTIONS)
  val all_settings = ISABELLE_BUILD_OPTIONS :: ml_settings


  /* entries: name/value pairs */

  type Entry = (String, String)
  type T = List[Entry]

  object Entry {
    // split a "name=value" line via Properties.Eq, then pass the value
    // through Library.perhaps_unquote
    def unapply(s: String): Option[Entry] =
      Properties.Eq.unapply(s).map({ case (a, b) => (a, Library.perhaps_unquote(b)) })

    // render the current value of setting "a" as a quoted "name=value" line
    def getenv(a: String): String =
      Properties.Eq(a, quote(Isabelle_System.getenv(a)))
  }


  /* show settings: general options, empty separator line, ML settings */

  def show(): String = {
    val general =
      List(
        Entry.getenv("ISABELLE_TOOL_JAVA_OPTIONS"),
        Entry.getenv(ISABELLE_BUILD_OPTIONS.name),
        "")
    val ml = ml_settings.map(c => Entry.getenv(c.name))
    cat_lines(general ::: ml)
  }
}
71 |
||
72 |
||
64298 | 73 |
/* file names */ |
74 |
||
75 |
// Date stamp for log file names: "yyyy-MM-dd" followed by "." and the
// number of seconds since midnight, zero-padded to 5 digits.
def log_date(date: Date): String = {
  val day = DateTimeFormatter.ofPattern("yyyy-MM-dd").format(date.rep)
  val seconds_of_day = java.lang.Long.valueOf((date.time - date.midnight.time).ms / 1000)
  String.format(Locale.ROOT, "%s.%05d", day, seconds_of_day)
}
64298 | 79 |
|
80 |
// Sub-directory for logs of the given date: "log" followed by the year.
def log_subdir(date: Date): Path = {
  val year = date.rep.getYear.toString
  Path.explode("log") + Path.explode(year)
}
|
82 |
||
83 |
// File name of the form ENGINE_DATE[_MORE...].log, where DATE is log_date(date).
def log_filename(engine: String, date: Date, more: List[String] = Nil): Path = {
  val components = engine :: log_date(date) :: more
  Path.explode(components.mkString("", "_", ".log"))
}
|
85 |
||
86 |
||
64100 | 87 |
|
64062 | 88 |
/** log file **/ |
64045 | 89 |
|
64155 | 90 |
// Print a date using the log file date format.
def print_date(date: Date): String = Log_File.Date_Format.apply(date)
91 |
||
75393 | 92 |
object Log_File {
  /* log file */

  // Strip the first matching log/compression suffix from a file name;
  // names without such a suffix are returned unchanged.
  def plain_name(name: String): String = {
    val known_suffixes = List(".log", ".log.gz", ".log.xz", ".gz", ".xz")
    known_suffixes.find(name.endsWith)
      .map(suffix => Library.try_unsuffix(suffix, name).get)
      .getOrElse(name)
  }

  // from lines: each line is passed through Library.trim_line
  def apply(name: String, lines: List[String]): Log_File = {
    val trimmed = lines.map(Library.trim_line)
    new Log_File(plain_name(name), trimmed)
  }

  // from text: split into trimmed lines
  def apply(name: String, text: String): Log_File = {
    val split = Library.trim_split_lines(text)
    new Log_File(plain_name(name), split)
  }

  // from file: the reader is chosen according to the file name (gz, xz, plain)
  def apply(file: JFile): Log_File = {
    val file_name = file.getName
    val content =
      if (File.is_gz(file_name)) File.read_gzip(file)
      else if (File.is_xz(file_name)) File.read_xz(file)
      else File.read(file)
    apply(file_name, content)
  }

  def apply(path: Path): Log_File = apply(path.file)


  /* log file collections */

  // A file counts as log if its name has one of the prefixes and one of the
  // suffixes, and is not one of the explicitly excluded names.
  def is_log(file: JFile,
    prefixes: List[String] =
      List(Build_History.log_prefix, Identify.log_prefix, Identify.log_prefix2,
        Isatest.log_prefix, AFP_Test.log_prefix),
    suffixes: List[String] = List(".log", ".log.gz", ".log.xz")
  ): Boolean = {
    val name = file.getName
    val excluded = Set("isatest.log", "afp-test.log", "main.log")

    prefixes.exists(name.startsWith) &&
    suffixes.exists(name.endsWith) &&
    !excluded.contains(name)
  }


  /* date format */

  val Date_Format = {
    val patterns = List("EEE MMM d HH:mm:ss O yyyy", "EEE MMM d HH:mm:ss VV yyyy")
    val locales = List(Locale.ENGLISH, Locale.GERMAN)

    val fmts =
      Date.Formatter.variants(patterns, locales) :::
      List(
        DateTimeFormatter.RFC_1123_DATE_TIME,
        Date.Formatter.pattern("EEE MMM d HH:mm:ss yyyy").withZone(Date.timezone_berlin))

    // replacements for time zone names; other words stay unchanged
    val timezones =
      Map(
        "CET" -> "GMT+1",
        "MET" -> "GMT+1",
        "CEST" -> "GMT+2",
        "MEST" -> "GMT+2",
        "EST" -> "Europe/Berlin")

    // replacements for three-letter weekday names; other words stay unchanged
    val weekdays =
      Map(
        "Die" -> "Di",
        "Mit" -> "Mi",
        "Don" -> "Do",
        "Fre" -> "Fr",
        "Sam" -> "Sa",
        "Son" -> "So")

    def tune_timezone(s: String): String = timezones.getOrElse(s, s)
    def tune_weekday(s: String): String = weekdays.getOrElse(s, s)

    // Normalize the words of a date string before parsing: weekday in first
    // position, time zone names afterwards; "M\uFFFDr" in second position
    // (containing the Unicode replacement character) becomes "Mär".
    def tune(s: String): String = {
      val tuned =
        Word.explode(s) match {
          case Nil => Nil
          case a :: "M\uFFFDr" :: bs => tune_weekday(a) :: "Mär" :: bs.map(tune_timezone)
          case a :: bs => tune_weekday(a) :: bs.map(tune_timezone)
        }
      Word.implode(tuned)
    }

    Date.Format.make(fmts, tune)
  }
}
179 |
||
75393 | 180 |
class Log_File private(val name: String, val lines: List[String]) {
  log_file =>

  override def toString: String = name

  def text: String = cat_lines(lines)

  // raise an error that mentions the (quoted) name of this log file
  def err(msg: String): Nothing =
    error("Error in log file " + quote(name) + ": " + msg)


  /* date format */

  // Extractor that always succeeds or fails hard: a parse exception is
  // turned into an error about this log file.
  object Strict_Date {
    def unapply(s: String): Some[Date] =
      try {
        Some(Log_File.Date_Format.parse(s))
      }
      catch {
        case exn: DateTimeParseException => log_file.err(exn.getMessage)
      }
  }


  /* inlined text */

  // all lines accepted by the marker, in order
  def filter(Marker: Protocol_Message.Marker): List[String] =
    lines.collect({ case Marker(text) => text })

  // first line accepted by the marker
  def find(Marker: Protocol_Message.Marker): Option[String] =
    lines.iterator.collect({ case Marker(text) => text }).nextOption()

  // Try the regexes one after another; the result is the single group of
  // the first line that matches the first successful regex.
  def find_match(regexes: List[Regex]): Option[String] =
    regexes match {
      case Nil => None
      case regex :: rest =>
        val found =
          lines.iterator.map(line => regex.unapplySeq(line)).
            collectFirst({ case Some(List(group)) => group })
        found orElse find_match(rest)
    }


  /* settings */

  def get_setting(name: String): Option[Settings.Entry] =
    lines.collectFirst({ case Settings.Entry(a, b) if a == name => a -> b })

  // entries for all known settings that occur in this log file
  def get_all_settings: Settings.T =
    Settings.all_settings.flatMap(c => get_setting(c.name))


  /* properties (YXML) */

  val cache: XML.Cache = XML.Cache.make()

  def parse_props(text: String): Properties.T =
    try {
      val body = YXML.parse_body(text)
      cache.props(XML.Decode.properties(body))
    }
    catch {
      case _: XML.Error => log_file.err("malformed properties")
    }

  def filter_props(marker: Protocol_Message.Marker): List[Properties.T] =
    filter(marker).filter(text => YXML.detect(text)).map(text => parse_props(text))

  def find_props(marker: Protocol_Message.Marker): Option[Properties.T] =
    find(marker).filter(text => YXML.detect(text)).map(text => parse_props(text))


  /* parse various formats */

  def parse_meta_info(): Meta_Info = Build_Log.parse_meta_info(log_file)

  def parse_build_info(ml_statistics: Boolean = false): Build_Info =
    Build_Log.parse_build_info(log_file, ml_statistics)

  def parse_session_info(
    command_timings: Boolean = false,
    theory_timings: Boolean = false,
    ml_statistics: Boolean = false,
    task_statistics: Boolean = false
  ): Session_Info =
    Build_Log.parse_session_info(
      log_file, command_timings, theory_timings, ml_statistics, task_statistics)
}
257 |
||
258 |
||
64098 | 259 |
|
75518
cb4af8c6152f
clarified remote vs. local build_history: operate on hg_sync directory instead of repository;
wenzelm
parents:
75394
diff
changeset
|
260 |
/** digested meta info: produced by Admin/build_other in log.xz file **/ |
64045 | 261 |
|
75393 | 262 |
object Meta_Info {
  // meta info without any properties or settings
  val empty: Meta_Info = new Meta_Info(Nil, Nil)
}

sealed case class Meta_Info(props: Properties.T, settings: Settings.T) {
  def is_empty: Boolean = !(props.nonEmpty || settings.nonEmpty)

  // look up the column name in props first, then in settings
  def get(c: SQL.Column): Option[String] = {
    val key = c.name
    Properties.get(props, key).orElse(Properties.get(settings, key))
  }

  // like get, with the value parsed by the log file date format
  def get_date(c: SQL.Column): Option[Date] =
    for (s <- get(c)) yield Log_File.Date_Format.parse(s)
}
64061
1bbea2b55d22
some support for header and data fields, notably from afp-test;
wenzelm
parents:
64054
diff
changeset
|
276 |
|
75393 | 277 |
object Identify {
  val log_prefix = "isabelle_identify_"
  val log_prefix2 = "plain_identify_"

  // engine name, depending on the prefix of the log file name
  def engine(log_file: Log_File): String = {
    val plain = log_file.name.startsWith(log_prefix2)
    if (plain) "plain_identify" else "identify"
  }

  // Log file content: start line with date, empty line, then the optional
  // version lines.
  def content(date: Date, isabelle_version: Option[String], afp_version: Option[String]): String = {
    val header = List("isabelle_identify: " + Build_Log.print_date(date), "")
    val isabelle = isabelle_version.map(v => "Isabelle version: " + v).toList
    val afp = afp_version.map(v => "AFP version: " + v).toList
    terminate_lines(header ::: isabelle ::: afp)
  }

  val Start = """^isabelle_identify: (.+)$""".r
  val No_End = """$.""".r
  val Isabelle_Version = List("""^Isabelle version: (\S+)$""".r)
  val AFP_Version = List("""^AFP version: (\S+)$""".r)
}
295 |
||
75393 | 296 |
object Isatest {
  val log_prefix = "isatest-makeall-"
  val engine = "isatest"

  // start line: groups are two " --- "-separated fields (used as date and host)
  val Start = """^------------------- starting test --- (.+) --- (.+)$""".r

  // end line (successful or FAILED): the group is the first field
  val End = """^------------------- test (?:successful|FAILED) --- (.+) --- .*$""".r

  val Isabelle_Version = List("""^Isabelle version: (\S+)$""".r)
}
303 |
||
75393 | 304 |
object AFP_Test {
  val log_prefix = "afp-test-devel-"
  val engine = "afp-test"

  // start line with two comma-separated fields (used as date and host)
  val Start = """^Start test(?: for .+)? at ([^,]+), (.*)$""".r

  // old form of start line: single field without comma
  val Start_Old = """^Start test(?: for .+)? at ([^,]+)$""".r

  val End = """^End test on (.+), .+, elapsed time:.*$""".r

  val Isabelle_Version = List("""^Isabelle version: .* -- hg id (\S+)$""".r)
  val AFP_Version = List("""^AFP version: .* -- hg id (\S+)$""".r)

  // "cp" failure due to exceeded disc quota
  val Bad_Init = """^cp:.*: Disc quota exceeded$""".r
}
1bbea2b55d22
some support for header and data fields, notably from afp-test;
wenzelm
parents:
64054
diff
changeset
|
314 |
|
75393 | 315 |
object Jenkins {
  val log_prefix = "jenkins_"
  val engine = "jenkins"

  val Host = """^Building remotely on (\S+) \((\S+)\).*$""".r

  // NOTE(review): the last alternative of the group is empty, so this
  // pattern accepts any line -- confirm that this is intended
  val Start = """^(?:Started by an SCM change|Started from command line by admin|).*$""".r

  val Start_Date = """^Build started at (.+)$""".r
  val No_End = """$.""".r

  // alternative formats, in the order given here
  val Isabelle_Version =
    List(
      """^(?:Build for Isabelle id|Isabelle id) (\w+).*$""".r,
      """^ISABELLE_CI_REPO_ID="(\w+)".*$""".r,
      """^(\w{12}) tip.*$""".r)

  val AFP_Version =
    List(
      """^(?:Build for AFP id|AFP id) (\w+).*$""".r,
      """^ISABELLE_CI_AFP_ID="(\w+)".*$""".r)

  val CONFIGURATION = "=== CONFIGURATION ==="
  val BUILD = "=== BUILD ==="
}
|
332 |
||
75393 | 333 |
// Detect the log file format from its first lines and extract meta info;
// the order of cases is significant.
private def parse_meta_info(log_file: Log_File): Meta_Info = {
  // Meta info for line-oriented formats: properties are derived from engine,
  // host, start date, the last line (end date), and version lines.
  def parse(engine: String, host: String, start: Date,
    End: Regex, Isabelle_Version: List[Regex], AFP_Version: List[Regex]
  ): Meta_Info = {
    // build id: host or engine (whichever is proper, otherwise "build")
    // together with the start time in ms
    val id_prefix = proper_string(host) orElse proper_string(engine) getOrElse "build"
    val build_id = Prop.build_id.name -> (id_prefix + ":" + start.time.ms)

    val build_engine = if (engine != "") List(Prop.build_engine.name -> engine) else Nil
    val build_host = if (host != "") List(Prop.build_host.name -> host) else Nil

    val start_date = List(Prop.build_start.name -> print_date(start))

    // lines are non-empty here: parse is only invoked after matching the first line
    val end_date =
      log_file.lines.last match {
        case End(log_file.Strict_Date(end_date)) =>
          List(Prop.build_end.name -> print_date(end_date))
        case _ => Nil
      }

    val isabelle_version =
      log_file.find_match(Isabelle_Version).map(v => Prop.isabelle_version.name -> v)
    val afp_version =
      log_file.find_match(AFP_Version).map(v => Prop.afp_version.name -> v)

    val props =
      List(
        List(build_id),
        build_engine,
        build_host,
        start_date,
        end_date,
        isabelle_version.toList,
        afp_version.toList).flatten

    Meta_Info(props, log_file.get_all_settings)
  }

  log_file.lines match {
    // digested meta info as YXML properties in the first line
    case line :: _ if Protocol.Meta_Info_Marker.test_yxml(line) =>
      val props = log_file.find_props(Protocol.Meta_Info_Marker).get
      Meta_Info(props, log_file.get_all_settings)

    case Identify.Start(log_file.Strict_Date(start)) :: _ =>
      parse(Identify.engine(log_file), "", start, Identify.No_End,
        Identify.Isabelle_Version, Identify.AFP_Version)

    case Isatest.Start(log_file.Strict_Date(start), host) :: _ =>
      parse(Isatest.engine, host, start, Isatest.End,
        Isatest.Isabelle_Version, Nil)

    case AFP_Test.Start(log_file.Strict_Date(start), host) :: _ =>
      parse(AFP_Test.engine, host, start, AFP_Test.End,
        AFP_Test.Isabelle_Version, AFP_Test.AFP_Version)

    case AFP_Test.Start_Old(log_file.Strict_Date(start)) :: _ =>
      parse(AFP_Test.engine, "", start, AFP_Test.End,
        AFP_Test.Isabelle_Version, AFP_Test.AFP_Version)

    // various forms of log files without usable content
    case line :: _ if line.startsWith("\u0000") => Meta_Info.empty
    case List(Isatest.End(_)) => Meta_Info.empty
    case _ :: AFP_Test.Bad_Init() :: _ => Meta_Info.empty
    case Nil => Meta_Info.empty

    case _ => log_file.err("cannot detect log file format")
  }
}
1bbea2b55d22
some support for header and data fields, notably from afp-test;
wenzelm
parents:
64054
diff
changeset
|
390 |
|
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
391 |
|
64098 | 392 |
|
75518
cb4af8c6152f
clarified remote vs. local build_history: operate on hg_sync directory instead of repository;
wenzelm
parents:
75394
diff
changeset
|
393 |
/** build info: toplevel output of isabelle build or Admin/build_other **/ |
64119
8094eaa38d4b
inline session ML statistics into main build log;
wenzelm
parents:
64117
diff
changeset
|
394 |
|
8094eaa38d4b
inline session ML statistics into main build log;
wenzelm
parents:
64117
diff
changeset
|
395 |
// property name for the session
val SESSION_NAME: String = "session_name"
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
396 |
|
75393 | 397 |
object Session_Status extends Enumeration {
  // the order of declarations determines the ids of the values
  val existing = Value
  val finished = Value
  val failed = Value
  val cancelled = Value
}
1bbea2b55d22
some support for header and data fields, notably from afp-test;
wenzelm
parents:
64054
diff
changeset
|
400 |
|
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
401 |
sealed case class Session_Entry(
  chapter: String = "",
  groups: List[String] = Nil,
  threads: Option[Int] = None,
  timing: Timing = Timing.zero,
  ml_timing: Timing = Timing.zero,
  sources: Option[String] = None,
  heap_size: Option[Space] = None,
  status: Option[Session_Status.Value] = None,
  errors: List[String] = Nil,
  theory_timings: Map[String, Timing] = Map.empty,
  ml_statistics: List[Properties.T] = Nil
) {
  // groups as lines of text, or None for an empty list
  def proper_groups: Option[String] =
    groups match {
      case Nil => None
      case _ => Some(cat_lines(groups))
    }

  def finished: Boolean = status.contains(Session_Status.finished)
  def failed: Boolean = status.contains(Session_Status.failed)
}
64054 | 418 |
|
75393 | 419 |
object Build_Info {
  // single entry with empty session name and one zero timing for the empty theory name
  val sessions_dummy: Map[String, Session_Entry] = {
    val dummy_timings = Map("" -> Timing.zero)
    Map("" -> Session_Entry(theory_timings = dummy_timings))
  }
}

sealed case class Build_Info(sessions: Map[String, Session_Entry]) {
  // names of sessions with status "finished"
  def finished_sessions: List[String] =
    sessions.toList.collect({ case (name, entry) if entry.finished => name })

  // names of sessions with status "failed"
  def failed_sessions: List[String] =
    sessions.toList.collect({ case (name, entry) if entry.failed => name })
}
428 |
||
75393 | 429 |
private def parse_build_info(log_file: Log_File, parse_ml_statistics: Boolean): Build_Info = { |
430 |
object Chapter_Name { |
|
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
431 |
def unapply(s: String): Some[(String, String)] = |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
432 |
space_explode('/', s) match { |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
433 |
case List(chapter, name) => Some((chapter, name)) |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
434 |
case _ => Some(("", s)) |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
435 |
} |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
436 |
} |
64054 | 437 |
|
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
438 |
val Session_No_Groups = new Regex("""^Session (\S+)$""") |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
439 |
val Session_Groups = new Regex("""^Session (\S+) \((.*)\)$""") |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
440 |
val Session_Finished1 = |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
441 |
new Regex("""^Finished (\S+) \((\d+):(\d+):(\d+) elapsed time, (\d+):(\d+):(\d+) cpu time.*$""") |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
442 |
val Session_Finished2 = |
72695 | 443 |
new Regex("""^Finished ([^\s/]+) \((\d+):(\d+):(\d+) elapsed time.*$""") |
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
444 |
val Session_Timing = |
65679 | 445 |
new Regex("""^Timing (\S+) \((\d+) threads, (\d+\.\d+)s elapsed time, (\d+\.\d+)s cpu time, (\d+\.\d+)s GC time.*$""") |
77551 | 446 |
val Session_Started1 = new Regex("""^(?:Running|Building) (\S+) \.\.\.$""") |
447 |
val Session_Started2 = new Regex("""^(?:Running|Building) (\S+) on \S+ \.\.\.$""") |
|
66913 | 448 |
val Sources = new Regex("""^Sources (\S+) (\S{""" + SHA1.digest_length + """})$""") |
64120 | 449 |
val Heap = new Regex("""^Heap (\S+) \((\d+) bytes\)$""") |
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
450 |
|
75393 | 451 |
object Theory_Timing { |
66874
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
452 |
def unapply(line: String): Option[(String, (String, Timing))] = |
71630
50425e4c3910
clarified modules: global quasi-scope for markers;
wenzelm
parents:
71621
diff
changeset
|
453 |
Protocol.Theory_Timing_Marker.unapply(line.replace('~', '-')).map(log_file.parse_props) |
50425e4c3910
clarified modules: global quasi-scope for markers;
wenzelm
parents:
71621
diff
changeset
|
454 |
match { |
72753 | 455 |
case Some((SESSION_NAME, session) :: props) => |
456 |
for (theory <- Markup.Name.unapply(props)) |
|
74782 | 457 |
yield (session, theory -> Markup.Timing_Properties.get(props)) |
66874
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
458 |
case _ => None |
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
459 |
} |
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
460 |
} |
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
461 |
|
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
462 |
var chapter = Map.empty[String, String] |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
463 |
var groups = Map.empty[String, List[String]] |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
464 |
var threads = Map.empty[String, Int] |
64054 | 465 |
var timing = Map.empty[String, Timing] |
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
466 |
var ml_timing = Map.empty[String, Timing] |
64086
ac7ae5067783
clarified status: started sessions may bomb without explicit FAILED or CANCELLED (cf. in afp-test-devel-2016-01-03.log);
wenzelm
parents:
64085
diff
changeset
|
467 |
var started = Set.empty[String] |
66913 | 468 |
var sources = Map.empty[String, String] |
77113 | 469 |
var heap_sizes = Map.empty[String, Space] |
66874
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
470 |
var theory_timings = Map.empty[String, Map[String, Timing]] |
64119
8094eaa38d4b
inline session ML statistics into main build log;
wenzelm
parents:
64117
diff
changeset
|
471 |
var ml_statistics = Map.empty[String, List[Properties.T]] |
65937 | 472 |
var errors = Map.empty[String, List[String]] |
64119
8094eaa38d4b
inline session ML statistics into main build log;
wenzelm
parents:
64117
diff
changeset
|
473 |
|
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
474 |
/* names of all sessions mentioned in the tables collected so far */
// NOTE(review): the keys of "errors" are not consulted here
def all_sessions: Set[String] = {
  val name_sets: List[Set[String]] =
    List(
      chapter.keySet, groups.keySet, threads.keySet, timing.keySet, ml_timing.keySet,
      started, sources.keySet, heap_sizes.keySet,
      theory_timings.keySet, ml_statistics.keySet)
  // left-to-right union, in the same order as listed above
  name_sets.reduceLeft(_ ++ _)
}
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
478 |
|
64054 | 479 |
|
64062 | 480 |
for (line <- log_file.lines) { |
64054 | 481 |
line match { |
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
482 |
case Session_No_Groups(Chapter_Name(chapt, name)) => |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
483 |
chapter += (name -> chapt) |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
484 |
groups += (name -> Nil) |
64119
8094eaa38d4b
inline session ML statistics into main build log;
wenzelm
parents:
64117
diff
changeset
|
485 |
|
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
486 |
case Session_Groups(Chapter_Name(chapt, name), grps) => |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
487 |
chapter += (name -> chapt) |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
488 |
groups += (name -> Word.explode(grps)) |
64119
8094eaa38d4b
inline session ML statistics into main build log;
wenzelm
parents:
64117
diff
changeset
|
489 |
|
77551 | 490 |
case Session_Started1(name) => |
491 |
started += name |
|
492 |
||
493 |
case Session_Started2(name) => |
|
64086
ac7ae5067783
clarified status: started sessions may bomb without explicit FAILED or CANCELLED (cf. in afp-test-devel-2016-01-03.log);
wenzelm
parents:
64085
diff
changeset
|
494 |
started += name |
64119
8094eaa38d4b
inline session ML statistics into main build log;
wenzelm
parents:
64117
diff
changeset
|
495 |
|
64054 | 496 |
case Session_Finished1(name, |
497 |
Value.Int(e1), Value.Int(e2), Value.Int(e3), |
|
498 |
Value.Int(c1), Value.Int(c2), Value.Int(c3)) => |
|
499 |
val elapsed = Time.hms(e1, e2, e3) |
|
500 |
val cpu = Time.hms(c1, c2, c3) |
|
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
501 |
timing += (name -> Timing(elapsed, cpu, Time.zero)) |
64119
8094eaa38d4b
inline session ML statistics into main build log;
wenzelm
parents:
64117
diff
changeset
|
502 |
|
64054 | 503 |
case Session_Finished2(name, |
504 |
Value.Int(e1), Value.Int(e2), Value.Int(e3)) => |
|
505 |
val elapsed = Time.hms(e1, e2, e3) |
|
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
506 |
timing += (name -> Timing(elapsed, Time.zero, Time.zero)) |
64119
8094eaa38d4b
inline session ML statistics into main build log;
wenzelm
parents:
64117
diff
changeset
|
507 |
|
64054 | 508 |
case Session_Timing(name, |
509 |
Value.Int(t), Value.Double(e), Value.Double(c), Value.Double(g)) => |
|
510 |
val elapsed = Time.seconds(e) |
|
511 |
val cpu = Time.seconds(c) |
|
512 |
val gc = Time.seconds(g) |
|
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
513 |
ml_timing += (name -> Timing(elapsed, cpu, gc)) |
64054 | 514 |
threads += (name -> t) |
64119
8094eaa38d4b
inline session ML statistics into main build log;
wenzelm
parents:
64117
diff
changeset
|
515 |
|
66913 | 516 |
case Sources(name, s) => |
517 |
sources += (name -> s) |
|
518 |
||
64120 | 519 |
case Heap(name, Value.Long(size)) => |
77113 | 520 |
heap_sizes += (name -> Space.bytes(size)) |
64120 | 521 |
|
71630
50425e4c3910
clarified modules: global quasi-scope for markers;
wenzelm
parents:
71621
diff
changeset
|
522 |
case _ if Protocol.Theory_Timing_Marker.test_yxml(line) => |
66874
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
523 |
line match { |
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
524 |
case Theory_Timing(name, theory_timing) => |
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
525 |
theory_timings += (name -> (theory_timings.getOrElse(name, Map.empty) + theory_timing)) |
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
526 |
case _ => log_file.err("malformed theory_timing " + quote(line)) |
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
527 |
} |
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
528 |
|
71630
50425e4c3910
clarified modules: global quasi-scope for markers;
wenzelm
parents:
71621
diff
changeset
|
529 |
case _ if parse_ml_statistics && Protocol.ML_Statistics_Marker.test_yxml(line) => |
50425e4c3910
clarified modules: global quasi-scope for markers;
wenzelm
parents:
71621
diff
changeset
|
530 |
Protocol.ML_Statistics_Marker.unapply(line).map(log_file.parse_props) match { |
66874
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
531 |
case Some((SESSION_NAME, name) :: props) => |
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
532 |
ml_statistics += (name -> (props :: ml_statistics.getOrElse(name, Nil))) |
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
533 |
case _ => log_file.err("malformed ML_statistics " + quote(line)) |
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
534 |
} |
64119
8094eaa38d4b
inline session ML statistics into main build log;
wenzelm
parents:
64117
diff
changeset
|
535 |
|
71630
50425e4c3910
clarified modules: global quasi-scope for markers;
wenzelm
parents:
71621
diff
changeset
|
536 |
case _ if Protocol.Error_Message_Marker.test_yxml(line) => |
50425e4c3910
clarified modules: global quasi-scope for markers;
wenzelm
parents:
71621
diff
changeset
|
537 |
Protocol.Error_Message_Marker.unapply(line).map(log_file.parse_props) match { |
66874
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
538 |
case Some(List((SESSION_NAME, name), (Markup.CONTENT, msg))) => |
71620 | 539 |
errors += (name -> (msg :: errors.getOrElse(name, Nil))) |
66874
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
540 |
case _ => log_file.err("malformed error message " + quote(line)) |
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
541 |
} |
65937 | 542 |
|
64054 | 543 |
case _ => |
544 |
} |
|
545 |
} |
|
546 |
||
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
547 |
val sessions = |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
548 |
Map( |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
549 |
(for (name <- all_sessions.toList) yield { |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
550 |
val status = |
72694 | 551 |
if (timing.isDefinedAt(name) || ml_timing.isDefinedAt(name)) |
65633 | 552 |
Session_Status.finished |
553 |
else if (started(name)) Session_Status.failed |
|
554 |
else Session_Status.existing |
|
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
555 |
val entry = |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
556 |
Session_Entry( |
65643 | 557 |
chapter = chapter.getOrElse(name, ""), |
558 |
groups = groups.getOrElse(name, Nil), |
|
559 |
threads = threads.get(name), |
|
560 |
timing = timing.getOrElse(name, Timing.zero), |
|
561 |
ml_timing = ml_timing.getOrElse(name, Timing.zero), |
|
66913 | 562 |
sources = sources.get(name), |
65643 | 563 |
heap_size = heap_sizes.get(name), |
564 |
status = Some(status), |
|
65937 | 565 |
errors = errors.getOrElse(name, Nil).reverse, |
66874
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
566 |
theory_timings = theory_timings.getOrElse(name, Map.empty), |
65643 | 567 |
ml_statistics = ml_statistics.getOrElse(name, Nil).reverse) |
64085
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
568 |
(name -> entry) |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
569 |
}):_*) |
1c451e5c145f
clarified parse_build_info: isabelle build output;
wenzelm
parents:
64083
diff
changeset
|
570 |
Build_Info(sessions) |
64054 | 571 |
} |
64099 | 572 |
|
573 |
||
574 |
||
72860 | 575 |
/** session info: produced by isabelle build as session database **/ |
64099 | 576 |
|
577 |
/* record of session information: timing properties, statistics, error messages */
sealed case class Session_Info(
  session_timing: Properties.T,
  command_timings: List[Properties.T],
  theory_timings: List[Properties.T],
  ml_statistics: List[Properties.T],
  task_statistics: List[Properties.T],
  errors: List[String]
) {
  /* copy of this record with message s added after the existing errors */
  def error(s: String): Session_Info = copy(errors = errors :+ s)
}
64099 | 588 |
|
589 |
/* build Session_Info from the marker lines of log_file;
   each Boolean flag decides whether the corresponding list is extracted or left as Nil */
private def parse_session_info(
  log_file: Log_File,
  command_timings: Boolean,
  theory_timings: Boolean,
  ml_statistics: Boolean,
  task_statistics: Boolean
): Session_Info = {
  // session timing and errors are always extracted
  val session_timing_props: Properties.T =
    log_file.find_props(Protocol.Session_Timing_Marker).getOrElse(Nil)

  val command_timing_props: List[Properties.T] =
    if (command_timings) log_file.filter_props(Protocol.Command_Timing_Marker) else Nil

  val theory_timing_props: List[Properties.T] =
    if (theory_timings) log_file.filter_props(Protocol.Theory_Timing_Marker) else Nil

  val ml_statistics_props: List[Properties.T] =
    if (ml_statistics) log_file.filter_props(Protocol.ML_Statistics_Marker) else Nil

  val task_statistics_props: List[Properties.T] =
    if (task_statistics) log_file.filter_props(Protocol.Task_Statistics_Marker) else Nil

  val error_messages = log_file.filter(Protocol.Error_Message_Marker)

  Session_Info(
    session_timing = session_timing_props,
    command_timings = command_timing_props,
    theory_timings = theory_timing_props,
    ml_statistics = ml_statistics_props,
    task_statistics = task_statistics_props,
    errors = error_messages)
}
65595 | 608 |
|
76351
2cee31cd92f0
generic support for XZ and Zstd compression in Isabelle/Scala;
wenzelm
parents:
76350
diff
changeset
|
609 |
/* encode error messages as YXML text and compress it; no errors means no data */
def compress_errors(
  errors: List[String],
  cache: Compress.Cache = Compress.Cache.none
): Option[Bytes] =
  errors match {
    case Nil => None
    case _ =>
      val body = XML.Encode.list(XML.Encode.string)(errors)
      Some(Bytes(YXML.string_of_body(body)).compress(cache = cache))
  }
|
65937 | 618 |
|
73033 | 619 |
/* uncompress bytes, parse the text as YXML body and decode it as list of messages;
   empty bytes yield no messages */
def uncompress_errors(bytes: Bytes, cache: XML.Cache = XML.Cache.make()): List[String] =
  if (!bytes.is_empty) {
    val text = bytes.uncompress(cache = cache.compress).text
    val body = YXML.parse_body(text, cache = cache)
    XML.Decode.list(YXML.string_of_body)(body)
  }
  else Nil
65937 | 625 |
|
65595 | 626 |
|
627 |
||
628 |
/** persistent store **/ |
|
629 |
||
65694 | 630 |
/* SQL data model */ |
631 |
||
75393 | 632 |
object Data { |
65702 | 633 |
/* table with name prefix "isabelle_build_log"; the suffix "_" + name is passed through
   if_proper(name, ...) -- presumably omitted for empty name, confirm against if_proper */
def build_log_table(name: String, columns: List[SQL.Column], body: String = ""): SQL.Table = {
  val table_name = "isabelle_build_log" + if_proper(name, "_" + name)
  SQL.Table(table_name, columns, body)
}
65700 | 635 |
|
636 |
||
65694 | 637 |
/* main content */ |
638 |
||
66857 | 639 |
// key columns
val log_name = SQL.Column.string("log_name").make_primary_key
val session_name = SQL.Column.string("session_name").make_primary_key
val theory_name = SQL.Column.string("theory_name").make_primary_key

// session description
val chapter = SQL.Column.string("chapter")
val groups = SQL.Column.string("groups")
val threads = SQL.Column.int("threads")

// session timing
val timing_elapsed = SQL.Column.long("timing_elapsed")
val timing_cpu = SQL.Column.long("timing_cpu")
val timing_gc = SQL.Column.long("timing_gc")
val timing_factor = SQL.Column.double("timing_factor")

// ML timing
val ml_timing_elapsed = SQL.Column.long("ml_timing_elapsed")
val ml_timing_cpu = SQL.Column.long("ml_timing_cpu")
val ml_timing_gc = SQL.Column.long("ml_timing_gc")
val ml_timing_factor = SQL.Column.double("ml_timing_factor")

// theory timing
val theory_timing_elapsed = SQL.Column.long("theory_timing_elapsed")
val theory_timing_cpu = SQL.Column.long("theory_timing_cpu")
val theory_timing_gc = SQL.Column.long("theory_timing_gc")

// session result
val heap_size = SQL.Column.long("heap_size")
val status = SQL.Column.string("status")
val errors = SQL.Column.bytes("errors")
val sources = SQL.Column.string("sources")
val ml_statistics = SQL.Column.bytes("ml_statistics")

// auxiliary flag column
val known = SQL.Column.bool("known")
65694 | 662 |
|
663 |
/* table "meta_info": log_name, followed by all properties and all settings */
val meta_info_table = {
  val columns = log_name :: (Prop.all_props ::: Settings.all_settings)
  build_log_table("meta_info", columns)
}
65694 | 665 |
|
666 |
/* table "sessions": one row of session data per log_name and session_name */
val sessions_table = {
  val columns =
    List(
      log_name, session_name, chapter, groups, threads,
      timing_elapsed, timing_cpu, timing_gc, timing_factor,
      ml_timing_elapsed, ml_timing_cpu, ml_timing_gc, ml_timing_factor,
      heap_size, status, errors, sources)
  build_log_table("sessions", columns)
}
65694 | 671 |
|
66874
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
672 |
/* table "theories": timing per log_name, session_name and theory_name */
val theories_table = {
  val columns =
    List(
      log_name, session_name, theory_name,
      theory_timing_elapsed, theory_timing_cpu, theory_timing_gc)
  build_log_table("theories", columns)
}
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
676 |
|
65694 | 677 |
/* table "ml_statistics": statistics bytes per log_name and session_name */
val ml_statistics_table = {
  val columns = List(log_name, session_name, ml_statistics)
  build_log_table("ml_statistics", columns)
}
65694 | 679 |
|
680 |
||
66855 | 681 |
/* AFP versions */ |
682 |
||
75393 | 683 |
/* distinct pairs of isabelle_version and afp_version from meta_info,
   restricted to rows where both versions are defined */
val isabelle_afp_versions_table: SQL.Table = {
  val isabelle_column = Prop.isabelle_version
  val afp_column = Prop.afp_version

  val columns = List(isabelle_column.make_primary_key, afp_column)
  val query =
    SQL.select(List(isabelle_column, afp_column), distinct = true) + meta_info_table +
      SQL.where(SQL.and(isabelle_column.defined, afp_column.defined))

  build_log_table("isabelle_afp_versions", columns, query)
}
690 |
||
691 |
||
65705 | 692 |
/* earliest pull date for repository version (PostgreSQL queries) */ |
65694 | 693 |
|
71621 | 694 |
/* date column: "afp_pull_date" if afp is set, "pull_date" otherwise */
def pull_date(afp: Boolean = false): SQL.Column =
  SQL.Column.date(if (afp) "afp_pull_date" else "pull_date")
65694 | 697 |
|
75393 | 698 |
/* table of the minimal build_start per repository version (from meta_info);
   with afp the version consists of isabelle_version and afp_version */
def pull_date_table(afp: Boolean = false): SQL.Table = {
  val name = if (afp) "afp_pull_date" else "pull_date"
  val versions =
    if (afp) List(Prop.isabelle_version, Prop.afp_version)
    else List(Prop.isabelle_version)

  val date_column = pull_date(afp)
  val version_list = versions.mkString(", ")

  // only rows where all versions and build_start are defined
  val all_defined = SQL.AND((versions ::: List(Prop.build_start)).map(_.defined))

  val query =
    s"SELECT $version_list, min(${Prop.build_start}) AS $date_column" +
      s" FROM $meta_info_table" +
      s" WHERE $all_defined" +
      s" GROUP BY $version_list"

  build_log_table(name, versions.map(_.make_primary_key) ::: List(date_column), query)
}
710 |
||
711 |
||
712 |
/* recent entries */ |
|
713 |
||
75968
5a782ca6872b
tuned signature: build_log db is specific to PostgreSQL;
wenzelm
parents:
75906
diff
changeset
|
714 |
/* SQL expression for the point of time that is the given number of days before now();
   negative days are treated as 0 */
def recent_time(days: Int): PostgreSQL.Source = {
  val non_negative_days = math.max(days, 0)
  s"now() - INTERVAL '$non_negative_days days'"
}
716 |
||
66863
6acd1a2bd146
clarified afp_pull_date: both repository versions are relevant;
wenzelm
parents:
66858
diff
changeset
|
717 |
/* table "recent_pull_date": rows of the pull date table that are either newer than
   recent_time(days), or satisfy the revision conditions built from rev / afp_rev;
   the AFP variant of the pull date table is used iff afp_rev is defined */
def recent_pull_date_table(
  days: Int,
  rev: String = "",
  afp_rev: Option[String] = None
): SQL.Table = {
  val with_afp = afp_rev.isDefined
  val afp_revision = afp_rev.getOrElse("")
  val source_table = pull_date_table(with_afp)

  val is_recent = pull_date(with_afp)(source_table).ident + " > " + recent_time(days)

  // NOTE(review): presumably if_proper drops the condition for an empty revision -- confirm
  val has_revisions =
    SQL.and(
      if_proper(rev, Prop.isabelle_version(source_table).equal(rev)),
      if_proper(afp_revision, Prop.afp_version(source_table).equal(afp_revision)))

  val condition = SQL.where(SQL.or(is_recent, has_revisions))

  SQL.Table("recent_pull_date", source_table.columns,
    source_table.select(source_table.columns, sql = condition))
}
65694 | 735 |
|
75968
5a782ca6872b
tuned signature: build_log db is specific to PostgreSQL;
wenzelm
parents:
75906
diff
changeset
|
736 |
/* query for distinct log_name of meta_info, inner join with the recent pull date table
   on equal isabelle_version */
def select_recent_log_names(days: Int): PostgreSQL.Source = {
  val info_table = meta_info_table
  val recent_table = recent_pull_date_table(days)

  val join_clause =
    SQL.join_inner + recent_table.query_named +
      " ON " + Prop.isabelle_version(info_table) + " = " + Prop.isabelle_version(recent_table)

  info_table.select(List(log_name), distinct = true, sql = join_clause)
}
743 |
||
75393 | 744 |
/* query for distinct rows of the recent pull date table, outer join on isabelle_version
   with an auxiliary selection "aux" of meta_info (restricted by sql); the extra column
   "known" tells if log_name of "aux" is defined; ordered by pull date, descending */
def select_recent_versions(
  days: Int,
  rev: String = "",
  afp_rev: Option[String] = None,
  sql: PostgreSQL.Source = ""
): PostgreSQL.Source = {
  val with_afp = afp_rev.isDefined
  val version = Prop.isabelle_version
  val recent_table = recent_pull_date_table(days, rev = rev, afp_rev = afp_rev)
  val info_table = meta_info_table
  val aux_table = SQL.Table("aux", info_table.columns, info_table.select(sql = sql))

  val known_column = known.copy(expr = log_name(aux_table).defined)
  val columns = recent_table.columns.map(_.apply(recent_table)) ::: List(known_column)

  val join_condition = " ON " + version(recent_table) + " = " + version(aux_table)
  val ordering = SQL.order_by(List(pull_date(with_afp)(recent_table)), descending = true)

  SQL.select(columns, distinct = true) +
    recent_table.query_named + SQL.join_outer + aux_table.query_named +
    join_condition + ordering
}
d3d5cb2d6866
pick isabelle_version based on build_log database;
wenzelm
parents:
65781
diff
changeset
|
764 |
|
65724 | 765 |
|
766 |
/* universal view on main data */ |
|
767 |
||
75393 | 768 |
/* universal table, built as a chain of joins:
     a = meta_info, outer join with AFP pull dates (on both versions)
     b = a, outer join with Isabelle pull dates (on isabelle_version)
     c = b, inner join with sessions (on log_name)
     result = c, outer join with ml_statistics (on log_name and session_name) */
val universal_table: SQL.Table = {
  val afp_pull_date = pull_date(afp = true)
  val isabelle_version = Prop.isabelle_version
  val afp_version = Prop.afp_version
  val info_table = meta_info_table
  val afp_dates = pull_date_table(afp = true)
  val isabelle_dates = pull_date_table()

  // table "a"
  val info_columns = info_table.columns.tail
  val a_columns = log_name :: afp_pull_date :: info_columns
  val a_join =
    SQL.and(
      isabelle_version(info_table).ident + " = " + isabelle_version(afp_dates).ident,
      afp_version(info_table).ident + " = " + afp_version(afp_dates).ident)
  val a_query =
    SQL.select(List(log_name, afp_pull_date) ::: info_columns.map(col => col(info_table))) +
      info_table + SQL.join_outer + afp_dates + " ON " + a_join
  val a_table = SQL.Table("a", a_columns, a_query)

  // table "b"
  val a_rest = a_columns.tail
  val b_columns = log_name :: pull_date() :: a_rest
  val b_query =
    SQL.select(
      List(log_name(a_table), pull_date()(isabelle_dates)) ::: a_rest.map(col => col(a_table))) +
      a_table.query_named + SQL.join_outer + isabelle_dates +
      " ON " + isabelle_version(a_table) + " = " + isabelle_version(isabelle_dates)
  val b_table = SQL.Table("b", b_columns, b_query)

  // table "c"
  val c_columns = b_columns ::: sessions_table.columns.tail
  val c_query =
    SQL.select(log_name(b_table) :: c_columns.tail) +
      b_table.query_named + SQL.join_inner + sessions_table +
      " ON " + log_name(b_table) + " = " + log_name(sessions_table)
  val c_table = SQL.Table("c", c_columns, c_query)

  // result: table "c" together with ml_statistics
  val statistics_join =
    SQL.and(
      log_name(c_table).ident + " = " + log_name(ml_statistics_table).ident,
      session_name(c_table).ident + " = " + session_name(ml_statistics_table).ident)
  val universal_query =
    SQL.select(c_columns.map(col => col(c_table)) ::: List(ml_statistics)) +
      c_table.query_named + SQL.join_outer + ml_statistics_table + " ON " + statistics_join

  build_log_table("", c_columns ::: List(ml_statistics), universal_query)
}
|
65694 | 809 |
} |
810 |
||
811 |
||
812 |
/* database access */ |
|
813 |
||
73031
f93f0597f4fb
clarified signature: absorb XZ.Cache into XML.Cache;
wenzelm
parents:
73025
diff
changeset
|
814 |
/* create a Store for the given options and XML cache (fresh cache by default) */
def store(options: Options, cache: XML.Cache = XML.Cache.make()): Store = {
  new Store(options, cache)
}
65595 | 816 |
|
75393 | 817 |
class Store private[Build_Log](options: Options, val cache: XML.Cache) { |
65595 | 818 |
/* Open the PostgreSQL build-log database. Every parameter defaults to the
   system option named "build_log_..." shown below. A non-empty ssh_host makes
   the connection go through an SSH session opened here; an empty one means
   no SSH session is passed on. */
def open_database(
  user: String = options.string("build_log_database_user"),
  password: String = options.string("build_log_database_password"),
  database: String = options.string("build_log_database_name"),
  host: String = options.string("build_log_database_host"),
  port: Int = options.int("build_log_database_port"),
  ssh_host: String = options.string("build_log_ssh_host"),
  ssh_user: String = options.string("build_log_ssh_user"),
  ssh_port: Int = options.int("build_log_ssh_port")
): PostgreSQL.Database = {
  val ssh_session =
    if (ssh_host != "") {
      Some(SSH.open_session(options, host = ssh_host, user = ssh_user, port = ssh_port))
    }
    else None

  // NOTE(review): ssh_close = true presumably lets the database close the
  // SSH session together with itself -- confirm in PostgreSQL.open_database.
  PostgreSQL.open_database(
    user = user,
    password = password,
    database = database,
    host = host,
    port = port,
    ssh = ssh_session,
    ssh_close = true)
}
65599 | 835 |
|
73340 | 836 |
/* Import all log files found below the given directories (following
   symbolic links) into the database via write_info, then (re)create the
   two pull_date views and the universal view. */
def update_database(
  db: PostgreSQL.Database,
  dirs: List[Path],
  ml_statistics: Boolean = false
): Unit = {
  val log_files =
    for {
      dir <- dirs
      file <- File.find_files(dir.file, pred = Log_File.is_log(_), follow_links = true)
    } yield file

  write_info(db, log_files, ml_statistics = ml_statistics)

  // views: Isabelle pull dates, AFP pull dates, full view
  db.create_view(Data.pull_date_table())
  db.create_view(Data.pull_date_table(afp = true))
  db.create_view(Data.universal_table)
}
847 |
||
75393 | 848 |
/* Write a snapshot of the recent part of the PostgreSQL database `db`
   (log entries selected by Data.select_recent_log_names(days)) into a fresh
   SQLite database file. ML statistics are copied only on request. */
def snapshot_database(
  db: PostgreSQL.Database,
  sqlite_database: Path,
  days: Int = 100,
  ml_statistics: Boolean = false
): Unit = {
  // start from scratch: ensure the directory exists, drop any old file
  Isabelle_System.make_directory(sqlite_database.dir)
  sqlite_database.file.delete

  using(SQLite.open_database(sqlite_database)) { db2 =>
    // copy meta info, sessions and (optionally) ML statistics of one log entry
    def copy_log(log_name: String): Unit = {
      for (meta_info <- read_meta_info(db, log_name)) {
        update_meta_info(db2, log_name, meta_info)
      }

      update_sessions(db2, log_name, read_build_info(db, log_name))

      if (ml_statistics) {
        val build_info = read_build_info(db, log_name, ml_statistics = true)
        update_ml_statistics(db2, log_name, build_info)
      }
    }

    // materialize the recent pull_date view of db as a table of db2,
    // transferring every column as string
    def copy_pull_dates(afp: Boolean): Unit = {
      val afp_rev = if (afp) Some("") else None
      val table = Data.pull_date_table(afp)
      db2.create_table(table)
      db2.using_statement(table.insert()) { insert_stmt =>
        val recent = Data.recent_pull_date_table(days, afp_rev = afp_rev)
        db.using_statement(recent.query) { query_stmt =>
          val res = query_stmt.execute_query()
          while (res.next()) {
            table.columns.zipWithIndex.foreach { case (c, i) =>
              insert_stmt.string(i + 1) = res.get_string(c)
            }
            insert_stmt.execute()
          }
        }
      }
    }

    db.transaction {
      db2.transaction {
        // main content
        db2.create_table(Data.meta_info_table)
        db2.create_table(Data.sessions_table)
        db2.create_table(Data.theories_table)
        db2.create_table(Data.ml_statistics_table)

        val recent_log_names =
          db.execute_query_statement(
            Data.select_recent_log_names(days),
            List.from[String], res => res.string(Data.log_name))

        recent_log_names.foreach(copy_log)

        // pull_date
        List(false, true).foreach(copy_pull_dates)

        // full view
        db2.create_view(Data.universal_table)
      }
    }
    db2.vacuum()
  }
}
909 |
||
65688 | 910 |
/* The set of distinct string values of `column` within `table`. */
def domain(db: SQL.Database, table: SQL.Table, column: SQL.Column): Set[String] = {
  val query = table.select(List(column), distinct = true)
  db.execute_query_statement(query, Set.from[String], res => res.string(column))
}
|
65688 | 914 |
|
77543 | 915 |
/* Insert the meta info of one log entry: parameter 1 is the log name, the
   remaining columns of the meta_info table follow from position 2 onwards,
   bound as date or string according to the column type. */
def update_meta_info(db: SQL.Database, log_name: String, meta_info: Meta_Info): Unit = {
  val table = Data.meta_info_table
  db.execute_statement(db.insert_permissive(table), body = { stmt =>
    stmt.string(1) = log_name
    table.columns.tail.zipWithIndex.foreach { case (c, i) =>
      val pos = i + 2
      if (c.T == SQL.Type.Date) stmt.date(pos) = meta_info.get_date(c)
      else stmt.string(pos) = meta_info.get(c)
    }
  })
}
|
65600 | 924 |
|
77543 | 925 |
/* Insert one row per session of the given build info into the sessions
   table; Build_Info.sessions_dummy is used when there are no sessions.

   Each row is executed explicitly inside the loop. Binding parameters for
   several sessions and executing only once would store just the last one.
   NOTE(review): this assumes execute_statement runs the statement once
   after its body, as update_meta_info relies on -- hence using_statement
   with an explicit execute() per row here. */
def update_sessions(db: SQL.Database, log_name: String, build_info: Build_Info): Unit = {
  val sessions =
    if (build_info.sessions.isEmpty) Build_Info.sessions_dummy
    else build_info.sessions

  db.using_statement(db.insert_permissive(Data.sessions_table)) { stmt =>
    for ((session_name, session) <- sessions) {
      stmt.string(1) = log_name
      stmt.string(2) = session_name
      stmt.string(3) = proper_string(session.chapter)
      stmt.string(4) = session.proper_groups
      stmt.int(5) = session.threads
      stmt.long(6) = session.timing.elapsed.proper_ms
      stmt.long(7) = session.timing.cpu.proper_ms
      stmt.long(8) = session.timing.gc.proper_ms
      stmt.double(9) = session.timing.factor
      stmt.long(10) = session.ml_timing.elapsed.proper_ms
      stmt.long(11) = session.ml_timing.cpu.proper_ms
      stmt.long(12) = session.ml_timing.gc.proper_ms
      stmt.double(13) = session.ml_timing.factor
      stmt.long(14) = session.heap_size.map(_.bytes)
      stmt.string(15) = session.status.map(_.toString)
      stmt.bytes(16) = compress_errors(session.errors, cache = cache.compress)
      stmt.string(17) = session.sources
      stmt.execute()
    }
  }
}
|
65642 | 951 |
|
77543 | 952 |
/* Insert one row per (session, theory) timing of the given build info into
   the theories table; Build_Info.sessions_dummy is used when no session
   has any theory timings.

   Each row is executed explicitly inside the loop. Binding parameters for
   several theories and executing only once would store just the last one.
   NOTE(review): this assumes execute_statement runs the statement once
   after its body, as update_meta_info relies on -- hence using_statement
   with an explicit execute() per row here. */
def update_theories(db: SQL.Database, log_name: String, build_info: Build_Info): Unit = {
  val sessions =
    if (build_info.sessions.forall({ case (_, session) => session.theory_timings.isEmpty }))
      Build_Info.sessions_dummy
    else build_info.sessions

  db.using_statement(db.insert_permissive(Data.theories_table)) { stmt =>
    for {
      (session_name, session) <- sessions
      (theory_name, timing) <- session.theory_timings
    } {
      stmt.string(1) = log_name
      stmt.string(2) = session_name
      stmt.string(3) = theory_name
      stmt.long(4) = timing.elapsed.ms
      stmt.long(5) = timing.cpu.ms
      stmt.long(6) = timing.gc.ms
      stmt.execute()
    }
  }
}
|
66874
0b8da0fc9563
store theory timings in session in build_log database;
wenzelm
parents:
66873
diff
changeset
|
971 |
|
77543 | 972 |
/* Insert the compressed ML statistics of every session that has some, one
   row per session. When no session has statistics, a single row with empty
   session name and no data is written instead.

   Each row is executed explicitly inside the loop. Binding parameters for
   several sessions and executing only once would store just the last one.
   NOTE(review): this assumes execute_statement runs the statement once
   after its body, as update_meta_info relies on -- hence using_statement
   with an explicit execute() per row here. */
def update_ml_statistics(db: SQL.Database, log_name: String, build_info: Build_Info): Unit = {
  // compression is done in parallel, before the statement is opened
  val ml_stats: List[(String, Option[Bytes])] =
    Par_List.map[(String, Session_Entry), (String, Option[Bytes])](
      { case (a, b) => (a, Properties.compress(b.ml_statistics, cache = cache.compress).proper) },
      build_info.sessions.iterator.filter(p => p._2.ml_statistics.nonEmpty).toList)
  val entries = if (ml_stats.nonEmpty) ml_stats else List("" -> None)

  db.using_statement(db.insert_permissive(Data.ml_statistics_table)) { stmt =>
    for ((session_name, ml_statistics) <- entries) {
      stmt.string(1) = log_name
      stmt.string(2) = session_name
      stmt.bytes(3) = ml_statistics
      stmt.execute()
    }
  }
}
|
65645
2c704ae04db1
clarified database layout: bulky ml_statistics are stored/retrieved separately;
wenzelm
parents:
65643
diff
changeset
|
986 |
|
75393 | 987 |
/* Import the given log files into the database tables for meta info,
   sessions, theories and -- only if ml_statistics is true -- ML statistics.

   Per table, the log names already present are read once; a file is parsed
   only if some participating table does not know it yet. Files are handled
   in groups of "build_log_transaction_size" (at least 1), parsed in
   parallel and written within one transaction per group.

   The ML statistics table takes part in the "required" check only when
   ml_statistics is true. Otherwise every file absent from that table would
   be re-parsed on each run although nothing is written for it. The table
   itself is still created in either case. */
def write_info(db: SQL.Database, files: List[JFile], ml_statistics: Boolean = false): Unit = {
  abstract class Table_Status(table: SQL.Table) {
    db.create_table(table)
    private var known: Set[String] = domain(db, table, Data.log_name)

    def required(file: JFile): Boolean = !known(Log_File.plain_name(file.getName))

    def update_db(db: SQL.Database, log_file: Log_File): Unit

    def update(log_file: Log_File): Unit = {
      if (!known(log_file.name)) {
        update_db(db, log_file)
        known += log_file.name
      }
    }
  }

  val main_status: List[Table_Status] =
    List(
      new Table_Status(Data.meta_info_table) {
        override def update_db(db: SQL.Database, log_file: Log_File): Unit =
          update_meta_info(db, log_file.name, log_file.parse_meta_info())
      },
      new Table_Status(Data.sessions_table) {
        override def update_db(db: SQL.Database, log_file: Log_File): Unit =
          update_sessions(db, log_file.name, log_file.parse_build_info())
      },
      new Table_Status(Data.theories_table) {
        override def update_db(db: SQL.Database, log_file: Log_File): Unit =
          update_theories(db, log_file.name, log_file.parse_build_info())
      })

  val ml_statistics_status: List[Table_Status] =
    if (ml_statistics) {
      List(
        new Table_Status(Data.ml_statistics_table) {
          override def update_db(db: SQL.Database, log_file: Log_File): Unit =
            update_ml_statistics(db, log_file.name,
              log_file.parse_build_info(ml_statistics = true))
        })
    }
    else {
      // keep the table in existence, without letting it demand any files
      db.create_table(Data.ml_statistics_table)
      Nil
    }

  val status = main_status ::: ml_statistics_status

  for (file_group <-
    files.filter(file => status.exists(_.required(file))).
      grouped(options.int("build_log_transaction_size") max 1)) {
    val log_files = Par_List.map[JFile, Log_File](Log_File.apply, file_group)
    db.transaction { log_files.foreach(log_file => status.foreach(_.update(log_file))) }
  }
}
1031 |
||
75393 | 1032 |
/* Read the meta info stored for one log name, if any. All columns after
   the first one are fetched as optional strings (dates are rendered via
   Log_File.Date_Format). The first Prop.all_props.length of them become
   props, the rest settings; undefined values are dropped. */
def read_meta_info(db: SQL.Database, log_name: String): Option[Meta_Info] = {
  val table = Data.meta_info_table
  val columns = table.columns.tail
  db.execute_query_statementO[Meta_Info](
    table.select(columns, sql = Data.log_name.where_equal(log_name)),
    { res =>
      val entries =
        for (c <- columns) yield {
          val value =
            if (c.T == SQL.Type.Date) res.get_date(c).map(Log_File.Date_Format(_))
            else res.get_string(c)
          c.name -> value
        }
      val (prop_entries, setting_entries) = entries.splitAt(Prop.all_props.length)
      val props = prop_entries.collect({ case (x, Some(y)) => (x, y) })
      val settings = setting_entries.collect({ case (x, Some(y)) => (x, y) })
      Meta_Info(props, settings)
    }
  )
}
1051 |
||
1052 |
/* Read the session entries stored for one log name, optionally restricted
   to the given session names. Rows with empty session name are excluded.
   With ml_statistics = true, the sessions table is outer-joined with the
   ML statistics table on log name and session name, and the statistics are
   uncompressed into each entry; otherwise they are left as Nil. */
def read_build_info(
  db: SQL.Database,
  log_name: String,
  session_names: List[String] = Nil,
  ml_statistics: Boolean = false
): Build_Info = {
  val main_table = Data.sessions_table
  val stats_table = Data.ml_statistics_table

  val main_columns = main_table.columns.tail.map(_.apply(main_table))

  val (columns, from) =
    if (!ml_statistics) (main_columns, main_table.ident)
    else {
      val join_condition =
        SQL.and(
          Data.log_name(main_table).ident + " = " + Data.log_name(stats_table).ident,
          Data.session_name(main_table).ident + " = " + Data.session_name(stats_table).ident)
      val join =
        main_table.ident + SQL.join_outer + stats_table.ident + " ON " + join_condition
      (main_columns ::: List(Data.ml_statistics(stats_table)), SQL.enclose(join))
    }

  val session_column = Data.session_name(main_table)
  val where =
    SQL.where(
      SQL.and(
        Data.log_name(main_table).equal(log_name),
        session_column.ident + " <> ''",
        if_proper(session_names, session_column.member(session_names))))

  val sessions =
    db.execute_query_statement(
      SQL.select(columns, sql = from + where),
      Map.from[String, Session_Entry],
      { res =>
        val name = res.string(Data.session_name)
        val entry =
          Session_Entry(
            chapter = res.string(Data.chapter),
            groups = split_lines(res.string(Data.groups)),
            threads = res.get_int(Data.threads),
            timing = res.timing(Data.timing_elapsed, Data.timing_cpu, Data.timing_gc),
            ml_timing =
              res.timing(Data.ml_timing_elapsed, Data.ml_timing_cpu, Data.ml_timing_gc),
            sources = res.get_string(Data.sources),
            heap_size = res.get_long(Data.heap_size).map(Space.bytes),
            status = res.get_string(Data.status).map(Session_Status.withName),
            errors = uncompress_errors(res.bytes(Data.errors), cache = cache),
            ml_statistics =
              if (!ml_statistics) Nil
              else Properties.uncompress(res.bytes(Data.ml_statistics), cache = cache))
        name -> entry
      }
    )
  Build_Info(sessions)
}
|
65595 | 1116 |
} |
77744 | 1117 |
|
1118 |
||
1119 |
/* maintain build_log database */ |
|
1120 |
||
1121 |
/* Maintain the build_log database: vacuum it, import the log directories
   first without and then with ML statistics, and finally write the SQLite
   snapshot if a path is given. */
def build_log_database(options: Options, log_dirs: List[Path],
  snapshot: Option[Path] = None
): Unit = {
  val store = Build_Log.store(options)
  using(store.open_database()) { db =>
    db.vacuum()
    for (with_ml_statistics <- List(false, true)) {
      store.update_database(db, log_dirs, ml_statistics = with_ml_statistics)
    }
    for (path <- snapshot) store.snapshot_database(db, path)
  }
}
|
64045 | 1132 |
} |