src/Pure/Admin/jenkins.scala
author wenzelm
Mon, 01 May 2017 10:58:54 +0200
changeset 65657 2773b6859c55
parent 65656 c266f045258b
child 65658 be817b7b8354
permissions -rw-r--r--
download Jenkins logs with inlined ml_statistics;

/*  Title:      Pure/Admin/jenkins.scala
    Author:     Makarius

Support for Jenkins continuous integration service.
*/

package isabelle


import java.net.URL
import java.time.ZoneId

import scala.util.matching.Regex


object Jenkins
{
  /* server API */

  /* Base URL of the Jenkins server, as given by the ISABELLE_JENKINS_ROOT setting
     (read via Isabelle_System.getenv_strict). */
  def root(): String =
  {
    val jenkins_root = Isabelle_System.getenv_strict("ISABELLE_JENKINS_ROOT")
    jenkins_root
  }

  /* Query the JSON API below the given URL: the request is url + "/api/json?" followed
     by the arguments joined with "&". The response text is parsed as JSON; a parse
     failure is reported as an error that mentions the full request. */
  def invoke(url: String, args: String*): Any =
  {
    val query = args.mkString("&")
    val req = url + "/api/json?" + query
    val text = Url.read(req)

    try { JSON.parse(text) }
    catch {
      // replace the parser's own message by one that names the offending request
      case ERROR(_) => error("Malformed JSON from " + quote(req))
    }
  }


  /* build jobs */

  /* Names of all jobs listed at the server root whose "_class" is
     "hudson.model.FreeStyleProject"; entries without "_class" or "name" are skipped. */
  def build_jobs(): List[String] =
  {
    val jobs = JSON.array(invoke(root()), "jobs").getOrElse(Nil)

    jobs.flatMap(job =>
      JSON.string(job, "_class") match {
        case Some("hudson.model.FreeStyleProject") => JSON.string(job, "name").toList
        case _ => Nil
      })
  }


  /* Download the logs of all builds of the given jobs into dir, one job after another,
     sharing a single Sessions.Store for all downloads. */
  def download_logs(job_names: List[String], dir: Path): Unit =
  {
    val store = Sessions.store()

    job_names.foreach(job_name =>
      build_job_infos(job_name).foreach(info => info.download_log(store, dir)))
  }


  /* job info */

  /* Description of one build of a Jenkins job: the job name, the build timestamp
     (converted via Time.ms), the URL of the main log, and the session log artifacts
     as triples (session name, file extension, URL). */
  sealed case class Job_Info(
    job_name: String,
    timestamp: Long,
    main_log: URL,
    session_logs: List[(String, String, URL)])
  {
    // build date, always expressed in the Europe/Berlin time zone
    val date: Date = Date(Time.ms(timestamp), ZoneId.of("Europe/Berlin"))

    // name of the local log file, without the compression extension
    def log_filename: Path =
      Build_Log.log_filename(Build_Log.Jenkins.engine, date, List(job_name))

    // fetch the main log from its URL and wrap it as Build_Log.Log_File
    def read_log_file(): Build_Log.Log_File =
      Build_Log.Log_File(log_filename.implode, Url.read(main_log))

    /* ML statistics of one session. The "db" artifact is preferred: it is copied to a
       temporary file and read as SQLite database. Otherwise the "gz" artifact is read
       and parsed as session log. The result is Nil if neither artifact is present. */
    def read_ml_statistics(store: Sessions.Store, session_name: String): List[Properties.T] =
    {
      // URL of the first artifact of this session with the given extension
      def get_log(ext: String): Option[URL] =
        session_logs.collectFirst({ case (a, b, url) if a == session_name && b == ext => url })

      get_log("db") match {
        case Some(url) =>
          Isabelle_System.with_tmp_file(session_name, "db") { database =>
            Bytes.write(database, Bytes.read(url))
            using(SQLite.open_database(database))(db =>
              store.read_build_log(db, session_name, ml_statistics = true)).ml_statistics
          }
        case None =>
          get_log("gz") match {
            case Some(url) =>
              val log_file = Build_Log.Log_File(session_name, Url.read_gzip(url))
              log_file.parse_session_info(ml_statistics = true).ml_statistics
            case None => Nil
          }
      }
    }

    /* Store the main log, followed by the ML statistics of all sessions (each entry
       tagged with its session name), as xz-compressed file below dir. Nothing is
       downloaded if that compressed file already exists. */
    def download_log(store: Sessions.Store, dir: Path): Unit =
    {
      val log_dir = dir + Build_Log.log_subdir(date)

      // The existence test must refer to the file that is actually written, i.e. the
      // one with "xz" extension: testing the uncompressed name would never succeed
      // and the log would be downloaded again on every invocation.
      val log_path = (log_dir + log_filename).ext("xz")

      if (!log_path.is_file) {
        val session_names = session_logs.map(_._1).distinct.sorted

        val ml_statistics =
          session_names.flatMap(session_name =>
            read_ml_statistics(store, session_name).
              map(props => (Build_Log.SESSION_NAME -> session_name) :: props))

        Isabelle_System.mkdirs(log_dir)
        File.write_xz(log_path,
          terminate_lines(Url.read(main_log) ::
            ml_statistics.map(Build_Log.Log_File.print_props(Build_Log.ML_STATISTICS_MARKER, _))),
          XZ.options(6))
      }
    }
  }

  /* Information about all builds of the given job, obtained from the "allBuilds"
     field of the job's JSON description. Builds without "number" or "timestamp" are
     skipped. Only artifacts whose relative path matches Session_Log are recorded. */
  def build_job_infos(job_name: String): List[Job_Info] =
  {
    val Session_Log = new Regex("""^.*/log/([^/]+)\.(db|gz)$""")

    val job_url = root() + "/job/" + job_name

    // session log artifacts of one build, as (session name, extension, URL)
    def session_logs_of(build: Any, build_url: String): List[(String, String, URL)] =
      JSON.array(build, "artifacts").getOrElse(Nil).flatMap(artifact =>
        JSON.string(artifact, "relativePath") match {
          case Some(log_path @ Session_Log(name, ext)) =>
            List((name, ext, Url(build_url + "/artifact/" + log_path)))
          case _ => Nil
        })

    val builds =
      JSON.array(
        invoke(job_url, "tree=allBuilds[number,timestamp,artifacts[*]]"),
        "allBuilds").getOrElse(Nil)

    for {
      build <- builds
      number <- JSON.int(build, "number")
      timestamp <- JSON.long(build, "timestamp")
    } yield {
      val build_url = job_url + "/" + number
      Job_Info(job_name, timestamp, Url(build_url + "/consoleText"),
        session_logs_of(build, build_url))
    }
  }
}