| author | wenzelm | 
| Wed, 29 Jan 2025 20:17:21 +0100 | |
| changeset 82015 | fe186fd7a168 | 
| parent 80817 | e31ebb2be437 | 
| child 82142 | 508a673c87ac | 
| permissions | -rw-r--r-- | 
| 68308 
119fc05f6b00
support to dump build database produced by PIDE session;
 wenzelm parents: diff
changeset | 1 | /* Title: Pure/Tools/dump.scala | 
| 
119fc05f6b00
support to dump build database produced by PIDE session;
 wenzelm parents: diff
changeset | 2 | Author: Makarius | 
| 
119fc05f6b00
support to dump build database produced by PIDE session;
 wenzelm parents: diff
changeset | 3 | |
| 68348 | 4 | Dump cumulative PIDE session database. | 
| 68308 
119fc05f6b00
support to dump build database produced by PIDE session;
 wenzelm parents: diff
changeset | 5 | */ | 
| 
119fc05f6b00
support to dump build database produced by PIDE session;
 wenzelm parents: diff
changeset | 6 | |
| 
119fc05f6b00
support to dump build database produced by PIDE session;
 wenzelm parents: diff
changeset | 7 | package isabelle | 
| 
119fc05f6b00
support to dump build database produced by PIDE session;
 wenzelm parents: diff
changeset | 8 | |
| 71534 | 9 | import java.io.{BufferedWriter, FileOutputStream, OutputStreamWriter}
 | 
| 10 | ||
| 68308 
119fc05f6b00
support to dump build database produced by PIDE session;
 wenzelm parents: diff
changeset | 11 | |
| 75393 | 12 | object Dump {
 | 
| 68316 | 13 | /* aspects */ | 
| 14 | ||
/* Arguments passed to an aspect operation: options, session dependencies,
   progress, the output directory, and the snapshot/status of one theory node. */
sealed case class Aspect_Args(
  options: Options,
  deps: Sessions.Deps,
  progress: Progress,
  output_dir: Path,
  snapshot: Document.Snapshot,
  status: Document_Status.Node_Status
) {
  // Place file_name below output_dir/<theory name> and create the directory
  // that will contain it; the resulting path is returned.
  def write_path(file_name: Path): Path = {
    val theory_dir = output_dir + Path.basic(snapshot.node_name.theory)
    val target = theory_dir + file_name
    Isabelle_System.make_directory(target.dir)
    target
  }

  // Write raw bytes to the location determined by write_path.
  def write(file_name: Path, bytes: Bytes): Unit = {
    val target = write_path(file_name)
    Bytes.write(target, bytes)
  }

  // Convert an XML body to YXML bytes (recoded via Symbol.encode) and write
  // them through the Bytes variant of write.
  def write(file_name: Path, body: XML.Body): Unit = {
    val bytes = YXML.bytes_of_body(body, recode = Symbol.encode)
    write(file_name, bytes)
  }
}
| 68316 | 35 | |
/* A named dump aspect: a description, the operation applied to Aspect_Args,
   and extra option specifications (empty by default). */
sealed case class Aspect(
  name: String,
  description: String,
  operation: Aspect_Args => Unit,
  options: List[String] = Nil
) {
  // An aspect prints as its bare name.
  override def toString: String = { name }
}
| 68316 | 44 | |
/* All aspects defined here, sorted by name. */
val known_aspects: List[Aspect] =
  List(
    Aspect(
      name = "markup",
      description = "PIDE markup (YXML format)",
      operation = { args =>
        args.write(Path.explode(Export.MARKUP), args.snapshot.xml_markup())
      }),
    Aspect(
      name = "messages",
      description = "output messages (YXML format)",
      operation = { args =>
        args.write(Path.explode(Export.MESSAGES), args.snapshot.messages.map(_._1))
      }),
    Aspect(
      name = "latex",
      description = "generated LaTeX source",
      // write every export whose name has the document prefix
      operation = { args =>
        args.snapshot.exports
          .withFilter(entry => entry.name_has_prefix(Export.DOCUMENT_PREFIX))
          .foreach(entry => args.write(Path.explode(entry.name), entry.bytes))
      }),
    Aspect(
      name = "theory",
      description = "foundational theory content",
      // write every export whose name has the theory prefix
      operation = { args =>
        args.snapshot.exports
          .withFilter(entry => entry.name_has_prefix(Export.THEORY_PREFIX))
          .foreach(entry => args.write(Path.explode(entry.name), entry.bytes))
      },
      options = List("export_theory"))
  ).sortBy(aspect => aspect.name)
| 68316 | 65 | |
// One line "name - description" per known aspect, joined via cat_lines.
def show_aspects: String = {
  val lines =
    for (aspect <- known_aspects)
    yield aspect.name + " - " + aspect.description
  cat_lines(lines)
}
| 68316 | 68 | |
// Look up a known aspect by name; an unknown name is reported via error().
def the_aspect(name: String): Aspect =
  known_aspects.find(_.name == name) match {
    case Some(aspect) => aspect
    case None => error("Unknown aspect " + quote(name))
  }
| 72 | ||
| 73 | ||
| 70856 
545229df2f82
clarified signature: static Dump.Context vs. dynamic Dump.Session;
 wenzelm parents: 
70796diff
changeset | 74 | /* context and session */ | 
| 69538 
faf547d2834c
clarified signature, notably cascade of dump_options, deps, resources, session;
 wenzelm parents: 
69537diff
changeset | 75 | |
/* Arguments for processing one theory: the running headless session together
   with the snapshot and status of the theory node. */
sealed case class Args(
  session: Headless.Session,
  snapshot: Document.Snapshot,
  status: Document_Status.Node_Status
) {
  // Printable form of the node name of the snapshot.
  def print_node: String = {
    val node_name = snapshot.node_name
    node_name.toString
  }
}
| 69896 | 83 | |
object Context {
  /* Build a Context: derive the session options, load and select the session
     structure, and compute the session dependencies (with error check). */
  def apply(
    options: Options,
    aspects: List[Aspect] = Nil,
    progress: Progress = new Progress,
    dirs: List[Path] = Nil,
    select_dirs: List[Path] = Nil,
    selection: Sessions.Selection = Sessions.Selection.empty,
    pure_base: Boolean = false,
    skip_base: Boolean = false
  ): Context = {
    // NUMA-adjusted base options, then fixed overrides, then the options
    // requested by the aspects (in aspect order).
    val session_options: Options = {
      val fixed_specs =
        List("parallel_proofs=0", "completion_limit=0", "editor_tracing_messages=0")
      val aspect_specs = aspects.flatMap(aspect => aspect.options)
      val numa_options = Host.numa_options(options, Host.numa_node0())
      (fixed_specs ::: aspect_specs).foldLeft(numa_options)((opts, spec) => opts + spec)
    }

    val sessions_structure: Sessions.Structure = {
      val full_structure =
        Sessions.load_structure(session_options, dirs = dirs, select_dirs = select_dirs)
      full_structure.selection(selection)
    }

    // announce the load only when more than one session is involved
    val selection_size = sessions_structure.build_graph.size
    if (selection_size > 1) progress.echo("Loading " + selection_size + " sessions ...")

    val deps: Sessions.Deps =
      Sessions.deps(sessions_structure, progress = progress).check_errors

    new Context(options, progress, dirs, select_dirs, pure_base, skip_base, session_options, deps)
  }
}
| 119 | ||
/* Static dump context: the given options and directories, the derived session
   options and dependencies, plus shared state (processed theories, errors)
   used by the sessions created from it. */
class Context private(
  val options: Options,
  val progress: Progress,
  val dirs: List[Path],
  val select_dirs: List[Path],
  val pure_base: Boolean,
  val skip_base: Boolean,
  val session_options: Options,
  val deps: Sessions.Deps
) {
  context =>

  // dirs followed by select_dirs
  def session_dirs: List[Path] = dirs ::: select_dirs

  // Build the given logic session (with heap, strict) before dumping.
  def build_logic(logic: String): Unit = {
    Build.build_logic(options, logic,
      build_heap = true,
      progress = progress,
      dirs = session_dirs,
      strict = true)
  }

  /* Partition the selected sessions into dump sessions; the result is ordered
     as proofs, base, main. */
  def sessions(
    logic: String = default_logic,
    log: Logger = new Logger
  ): List[Session] = {
    /* partitions */

    def session_info(session_name: String): Sessions.Info =
      deps.sessions_structure(session_name)

    val session_graph = deps.sessions_structure.build_graph
    val all_sessions = session_graph.topological_order

    // the logic session (if defined in the graph) with all its predecessors
    val base_sessions = {
      val roots = if (session_graph.defined(logic)) List(logic) else Nil
      session_graph.all_preds_rev(roots)
    }

    // sessions that record proofs, with all their successors
    val proof_sessions = {
      val recording = all_sessions.filter(name => session_info(name).record_proofs)
      session_graph.all_succs(recording)
    }


    /* resulting sessions */

    // At most one Session; an empty selection yields none unless strict.
    def make_session(
      selected_sessions: List[String],
      session_logic: String = logic,
      strict: Boolean = false,
      record_proofs: Boolean = false
    ): List[Session] = {
      if (strict || selected_sessions.nonEmpty) {
        List(new Session(context, session_logic, log, selected_sessions, record_proofs))
      }
      else Nil
    }

    val PURE = isabelle.Thy_Header.PURE

    val base = {
      val omit_base = skip_base || (logic == PURE && !pure_base)
      if (omit_base) Nil
      else make_session(base_sessions, session_logic = PURE, strict = logic == PURE)
    }

    // everything that is neither a base session nor a proof session
    val main = {
      val remaining =
        session_graph.topological_order.filter(name =>
          !base_sessions.contains(name) && !proof_sessions.contains(name))
      make_session(remaining)
    }

    val proofs = make_session(proof_sessions, session_logic = PURE, record_proofs = true)

    proofs ::: base ::: main
  }


  /* processed theories */

  private val processed_theories = Synchronized(Set.empty[String])

  // Register a theory name; the result is true only when the name was not
  // registered before.
  def process_theory(theory: String): Boolean =
    processed_theories.change_result { seen =>
      val fresh = !seen(theory)
      (fresh, seen + theory)
    }


  /* errors */

  private val errors = Synchronized(List.empty[String])

  // Append further error messages to the accumulated list.
  def add_errors(more_errs: List[String]): Unit = {
    errors.change(_ ::: more_errs)
  }

  // Raise all accumulated errors as one message, if there are any.
  def check_errors: Unit = {
    errors.value match {
      case Nil =>
      case errs => error(errs.mkString("\n\n"))
    }
  }
}
| 68926 | 210 | |
/* Dynamic dump session: headless resources for one logic, the theories to be
   loaded for the selected sessions, and the processing loop over them. */
class Session private[Dump](
  val context: Context,
  val logic: String,
  log: Logger,
  selected_sessions: List[String],
  record_proofs: Boolean
) {
  /* resources */

  // context session options, extended by record_proofs=2 on demand
  val options: Options = {
    val base_options = context.session_options
    if (record_proofs) base_options + "record_proofs=2" else base_options
  }

  private def deps = context.deps
  private def progress = context.progress

  val resources: Headless.Resources =
    Headless.Resources.make(options, logic,
      progress = progress,
      log = log,
      session_dirs = context.session_dirs,
      include_sessions = deps.sessions_structure.imports_topological_order)

  // Theories of the selected sessions (in topological session order) that are
  // not already loaded in the session base and pass the guards below.
  val used_theories: List[Document.Node.Name] = {
    val ordered_sessions =
      deps.sessions_structure.build_graph.restrict(selected_sessions.toSet).topological_order
    for {
      session_name <- ordered_sessions
      (name, theory_options) <- deps(session_name).used_theories
      if !resources.session_base.loaded_theory(name.theory)
      if {
        // emit the warning and reject the theory
        def skip(reason: String): Boolean = {
          progress.echo_warning("Skipping theory " + name + "  (" + reason + ")")
          false
        }

        // names from the "condition" option whose environment value is empty
        val undefined =
          space_explode(',', theory_options.string("condition")).
            filter(variable => Isabelle_System.getenv(variable) == "")

        if (undefined.nonEmpty) skip("undefined " + undefined.mkString(", "))
        else if (options.bool("skip_proofs") && !theory_options.bool("skip_proofs")) {
          skip("option skip_proofs")
        }
        else true
      }
    } yield name
  }


  /* process */

  // Start a headless session, load used_theories, and hand each committed
  // snapshot to process_theory on a separate consumer thread; failures and
  // pending theories are added to the context errors. The session is stopped
  // in any case.
  def process(process_theory: Args => Unit, unicode_symbols: Boolean = false): Unit = {
    val session = resources.start_session(progress = progress)


    // asynchronous consumer

    object Consumer {
      sealed case class Bad_Theory(
        name: Document.Node.Name,
        status: Document_Status.Node_Status,
        errors: List[String])

      // failures in reverse order of occurrence (newest first)
      private val failures = Synchronized(List.empty[Bad_Theory])

      private val thread =
        Consumer_Thread.fork(name = "dump")(consume =
          { (args: (Document.Snapshot, Document_Status.Node_Status)) =>
            val (snapshot, status) = args
            val name = snapshot.node_name
            if (status.ok) {
              try {
                // each theory name is processed at most once per context
                if (context.process_theory(name.theory)) {
                  process_theory(Args(session, snapshot, status))
                }
              }
              catch {
                // interrupts are not handled here
                case exn: Throwable if !Exn.is_interrupt(exn) =>
                  val msg = Exn.message(exn)
                  progress.echo("FAILED to process theory " + name)
                  progress.echo_error_message(msg)
                  failures.change(Bad_Theory(name, status, List(msg)) :: _)
              }
            }
            else {
              // collect the error messages of the failed node
              val error_msgs =
                snapshot.messages.collect {
                  case (elem, pos) if Protocol.is_error(elem) =>
                    "Error" + Position.here(pos) + ":\n" +
                      XML.content(Pretty.formatted(List(elem)))
                }
              progress.echo("FAILED to process theory " + name)
              error_msgs.foreach(msg => progress.echo_error_message(msg))
              failures.change(Bad_Theory(name, status, error_msgs) :: _)
            }
            true
          })

      def apply(snapshot: Document.Snapshot, status: Document_Status.Node_Status): Unit =
        thread.send((snapshot, status))

      // Shut down the consumer thread, then return failures in order of occurrence.
      def shutdown(): List[Bad_Theory] = {
        thread.shutdown()
        failures.value.reverse
      }
    }


    // synchronous body

    try {
      val use_theories_result =
        session.use_theories(used_theories.map(_.theory),
          unicode_symbols = unicode_symbols,
          progress = progress,
          commit = Some(Consumer.apply))

      val failure_msgs =
        for (bad <- Consumer.shutdown()) yield {
          val unfinished =
            if (bad.status.consolidated) ""
            else ": " + bad.status.percentage + "% finished"
          val details = if_proper(bad.errors, bad.errors.mkString("\n", "\n", ""))
          Protocol_Message.clean_output("FAILED theory " + bad.name + unfinished + details)
        }

      val pending_msgs = {
        val pending = use_theories_result.nodes_pending
        if (pending.isEmpty) Nil
        else List("Pending theories: " + commas(pending.map(_._1.toString)))
      }

      context.add_errors(failure_msgs ::: pending_msgs)
    }
    finally { session.stop() }
  }
}
| 
119fc05f6b00
support to dump build database produced by PIDE session;
 wenzelm parents: diff
changeset | 346 | |
| 
119fc05f6b00
support to dump build database produced by PIDE session;
 wenzelm parents: diff
changeset | 347 | |
| 69523 | 348 | /* dump */ | 
| 349 | ||
// default value of the output_dir parameter of dump
val default_output_dir: Path = { Path.explode("dump") }

// default value of the logic parameter of Context.sessions
val default_logic: String = { Thy_Header.PURE }
| 69523 | 352 | |
/* Dump the given aspects for all selected sessions: create the context, build
   the logic, run every aspect operation on each processed theory, and finally
   raise the errors accumulated in the context. */
def dump(
  options: Options,
  logic: String,
  aspects: List[Aspect] = Nil,
  progress: Progress = new Progress,
  log: Logger = new Logger,
  dirs: List[Path] = Nil,
  select_dirs: List[Path] = Nil,
  output_dir: Path = default_output_dir,
  selection: Sessions.Selection = Sessions.Selection.empty
): Unit = {
  val context =
    Context(options,
      aspects = aspects,
      progress = progress,
      dirs = dirs,
      select_dirs = select_dirs,
      selection = selection)

  context.build_logic(logic)

  val dump_sessions = context.sessions(logic = logic, log = log)
  dump_sessions.foreach { session =>
    session.process({ (args: Args) =>
      progress.echo("Processing theory " + args.print_node + " ...")
      val aspect_args =
        Aspect_Args(session.options, context.deps, progress, output_dir,
          args.snapshot, args.status)
      for (aspect <- aspects) aspect.operation(aspect_args)
    })
  }

  context.check_errors
}
| 382 | ||
| 383 | ||
| 68308 
119fc05f6b00
support to dump build database produced by PIDE session;
 wenzelm parents: diff
changeset | 384 | /* Isabelle tool wrapper */ | 
| 
119fc05f6b00
support to dump build database produced by PIDE session;
 wenzelm parents: diff
changeset | 385 | |
| 
119fc05f6b00
support to dump build database produced by PIDE session;
 wenzelm parents: diff
/* Command-line wrapper "isabelle dump": parses the options listed in the
   usage text, treats the remaining arguments as session names, runs dump()
   under the progress interrupt handler and reports the elapsed time. */
val isabelle_tool =
  Isabelle_Tool("dump", "dump cumulative PIDE session database", Scala_Project.here,
    { args =>
      // what to dump, and where to put it
      var aspects: List[Aspect] = known_aspects
      var output_dir = default_output_dir
      var logic = default_logic
      var options = Options.init()
      var verbose = false

      // session directories
      var dirs: List[Path] = Nil
      var select_dirs: List[Path] = Nil

      // session selection
      var requirements = false
      var all_sessions = false
      var base_sessions: List[String] = Nil
      var session_groups: List[String] = Nil
      var exclude_session_groups: List[String] = Nil
      var exclude_sessions: List[String] = Nil

      val usage = """
Usage: isabelle dump [OPTIONS] [SESSIONS ...]

  Options are:
    -A NAMES     dump named aspects (default: """ + known_aspects.mkString("\"", ",", "\"") + """)
    -B NAME      include session NAME and all descendants
    -D DIR       include session directory and select its sessions
    -O DIR       output directory for dumped files (default: """ + default_output_dir + """)
    -R           refer to requirements of selected sessions
    -X NAME      exclude sessions from group NAME and all descendants
    -a           select all sessions
    -b NAME      base logic image (default """ + isabelle.quote(default_logic) + """)
    -d DIR       include session directory
    -g NAME      select session group NAME
    -o OPTION    override Isabelle system OPTION (via NAME=VAL or NAME)
    -v           verbose
    -x NAME      exclude session NAME and all descendants

  Dump cumulative PIDE session database, with the following aspects:

""" + Library.indent_lines(4, show_aspects) + "\n"

      // repeatable options accumulate their arguments in command-line order
      val getopts = Getopts(usage,
        "A:" -> (arg => aspects = Library.distinct(space_explode(',', arg)).map(the_aspect)),
        "B:" -> (arg => base_sessions = base_sessions :+ arg),
        "D:" -> (arg => select_dirs = select_dirs :+ Path.explode(arg)),
        "O:" -> (arg => output_dir = Path.explode(arg)),
        "R" -> (_ => requirements = true),
        "X:" -> (arg => exclude_session_groups = exclude_session_groups :+ arg),
        "a" -> (_ => all_sessions = true),
        "b:" -> (arg => logic = arg),
        "d:" -> (arg => dirs = dirs :+ Path.explode(arg)),
        "g:" -> (arg => session_groups = session_groups :+ arg),
        "o:" -> (arg => options = options + arg),
        "v" -> (_ => verbose = true),
        "x:" -> (arg => exclude_sessions = exclude_sessions :+ arg))

      // arguments left over after option parsing are the explicitly named sessions
      val session_names = getopts(args)

      val progress = new Console_Progress(verbose = verbose)

      val start_date = Date.now()

      progress.echo("Started at " + Build_Log.print_date(start_date), verbose = true)

      progress.interrupt_handler {
        val selection =
          Sessions.Selection(
            requirements = requirements,
            all_sessions = all_sessions,
            base_sessions = base_sessions,
            exclude_session_groups = exclude_session_groups,
            exclude_sessions = exclude_sessions,
            session_groups = session_groups,
            sessions = session_names)

        dump(options, logic,
          aspects = aspects,
          progress = progress,
          dirs = dirs,
          select_dirs = select_dirs,
          output_dir = output_dir,
          selection = selection)
      }

      val end_date = Date.now()

      progress.echo("\nFinished at " + Build_Log.print_date(end_date), verbose = true)
      progress.echo((end_date - start_date).message_hms + " elapsed time")
    })
| 68308 
119fc05f6b00
support to dump build database produced by PIDE session;
 wenzelm parents: diff
changeset | 469 | } |