src/Pure/Tools/build_schedule.scala
author Fabian Huch <huch@in.tum.de>
Fri, 01 Dec 2023 20:54:00 +0100
changeset 79108 ed00312f694f
parent 79107 f5a2f956b531
child 79109 c1255d9870f6
permissions -rw-r--r--
tuned;
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
     1
/*  Title:      Pure/Tools/build_schedule.scala
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
     2
    Author:     Fabian Huch, TU Muenchen
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
     3
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
     4
Build schedule generated by Heuristic methods, allowing for more efficient builds.
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
     5
 */
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
     6
package isabelle
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
     7
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
     8
78846
966aa081929f tuned imports;
wenzelm
parents: 78845
diff changeset
     9
import Host.Node_Info
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
    10
import scala.annotation.tailrec
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
    11
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
    12
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
    13
object Build_Schedule {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
    14
  /* organized historic timing information (extracted from build logs) */
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
    15
79085
cf51ccfd3e39 use full timing information in build schedule;
Fabian Huch <huch@in.tum.de>
parents: 79084
diff changeset
    16
  case class Timing_Entry(job_name: String, hostname: String, threads: Int, timing: Timing) {
cf51ccfd3e39 use full timing information in build schedule;
Fabian Huch <huch@in.tum.de>
parents: 79084
diff changeset
    17
    def elapsed: Time = timing.elapsed
79087
3620010c410a use cpu time for approximation;
Fabian Huch <huch@in.tum.de>
parents: 79086
diff changeset
    18
    def proper_cpu: Option[Time] = timing.cpu.proper_ms.map(Time.ms)
79085
cf51ccfd3e39 use full timing information in build schedule;
Fabian Huch <huch@in.tum.de>
parents: 79084
diff changeset
    19
  }
79035
6beb60b508e6 clarified timing data vs. timing entries: full top-level data view vs. dynamic partial data;
Fabian Huch <huch@in.tum.de>
parents: 79034
diff changeset
    20
  case class Timing_Entries(entries: List[Timing_Entry]) {
6beb60b508e6 clarified timing data vs. timing entries: full top-level data view vs. dynamic partial data;
Fabian Huch <huch@in.tum.de>
parents: 79034
diff changeset
    21
    require(entries.nonEmpty)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
    22
79035
6beb60b508e6 clarified timing data vs. timing entries: full top-level data view vs. dynamic partial data;
Fabian Huch <huch@in.tum.de>
parents: 79034
diff changeset
    23
    def is_empty = entries.isEmpty
6beb60b508e6 clarified timing data vs. timing entries: full top-level data view vs. dynamic partial data;
Fabian Huch <huch@in.tum.de>
parents: 79034
diff changeset
    24
    def size = entries.length
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
    25
79035
6beb60b508e6 clarified timing data vs. timing entries: full top-level data view vs. dynamic partial data;
Fabian Huch <huch@in.tum.de>
parents: 79034
diff changeset
    26
    lazy val by_job = entries.groupBy(_.job_name).view.mapValues(Timing_Entries(_)).toMap
6beb60b508e6 clarified timing data vs. timing entries: full top-level data view vs. dynamic partial data;
Fabian Huch <huch@in.tum.de>
parents: 79034
diff changeset
    27
    lazy val by_threads = entries.groupBy(_.threads).view.mapValues(Timing_Entries(_)).toMap
6beb60b508e6 clarified timing data vs. timing entries: full top-level data view vs. dynamic partial data;
Fabian Huch <huch@in.tum.de>
parents: 79034
diff changeset
    28
    lazy val by_hostname = entries.groupBy(_.hostname).view.mapValues(Timing_Entries(_)).toMap
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
    29
79035
6beb60b508e6 clarified timing data vs. timing entries: full top-level data view vs. dynamic partial data;
Fabian Huch <huch@in.tum.de>
parents: 79034
diff changeset
    30
    def mean_time: Time = Timing_Data.mean_time(entries.map(_.elapsed))
6beb60b508e6 clarified timing data vs. timing entries: full top-level data view vs. dynamic partial data;
Fabian Huch <huch@in.tum.de>
parents: 79034
diff changeset
    31
    def best_entry: Timing_Entry = entries.minBy(_.elapsed.ms)
6beb60b508e6 clarified timing data vs. timing entries: full top-level data view vs. dynamic partial data;
Fabian Huch <huch@in.tum.de>
parents: 79034
diff changeset
    32
  }
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
    33
79035
6beb60b508e6 clarified timing data vs. timing entries: full top-level data view vs. dynamic partial data;
Fabian Huch <huch@in.tum.de>
parents: 79034
diff changeset
    34
  class Timing_Data private(data: Timing_Entries, val host_infos: Host_Infos) {
79025
f78ee2d48bf5 handle inflection point in interpolation with monotone prefix;
Fabian Huch <huch@in.tum.de>
parents: 79024
diff changeset
    35
    private def inflection_point(last_mono: Int, next: Int): Int =
f78ee2d48bf5 handle inflection point in interpolation with monotone prefix;
Fabian Huch <huch@in.tum.de>
parents: 79024
diff changeset
    36
      last_mono + ((next - last_mono) / 2)
f78ee2d48bf5 handle inflection point in interpolation with monotone prefix;
Fabian Huch <huch@in.tum.de>
parents: 79024
diff changeset
    37
79028
6bada416ba55 clarified timing data operations: proper estimation (instead of known points);
Fabian Huch <huch@in.tum.de>
parents: 79027
diff changeset
    38
    def best_threads(job_name: String, max_threads: Int): Int = {
6bada416ba55 clarified timing data operations: proper estimation (instead of known points);
Fabian Huch <huch@in.tum.de>
parents: 79027
diff changeset
    39
      val worse_threads =
79035
6beb60b508e6 clarified timing data vs. timing entries: full top-level data view vs. dynamic partial data;
Fabian Huch <huch@in.tum.de>
parents: 79034
diff changeset
    40
        data.by_job.get(job_name).toList.flatMap(_.by_hostname).flatMap {
79028
6bada416ba55 clarified timing data operations: proper estimation (instead of known points);
Fabian Huch <huch@in.tum.de>
parents: 79027
diff changeset
    41
          case (hostname, data) =>
6bada416ba55 clarified timing data operations: proper estimation (instead of known points);
Fabian Huch <huch@in.tum.de>
parents: 79027
diff changeset
    42
            val best_threads = data.best_entry.threads
6bada416ba55 clarified timing data operations: proper estimation (instead of known points);
Fabian Huch <huch@in.tum.de>
parents: 79027
diff changeset
    43
            data.by_threads.keys.toList.sorted.find(_ > best_threads).map(
6bada416ba55 clarified timing data operations: proper estimation (instead of known points);
Fabian Huch <huch@in.tum.de>
parents: 79027
diff changeset
    44
              inflection_point(best_threads, _))
6bada416ba55 clarified timing data operations: proper estimation (instead of known points);
Fabian Huch <huch@in.tum.de>
parents: 79027
diff changeset
    45
        }
6bada416ba55 clarified timing data operations: proper estimation (instead of known points);
Fabian Huch <huch@in.tum.de>
parents: 79027
diff changeset
    46
      (max_threads :: worse_threads).min
6bada416ba55 clarified timing data operations: proper estimation (instead of known points);
Fabian Huch <huch@in.tum.de>
parents: 79027
diff changeset
    47
    }
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
    48
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
    49
    private def hostname_factor(from: String, to: String): Double =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
    50
      host_infos.host_factor(host_infos.the_host(from), host_infos.the_host(to))
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
    51
79041
ff7d48e776ab properly sort entries;
Fabian Huch <huch@in.tum.de>
parents: 79040
diff changeset
    52
    private def approximate_threads(entries_unsorted: List[(Int, Time)], threads: Int): Time = {
ff7d48e776ab properly sort entries;
Fabian Huch <huch@in.tum.de>
parents: 79040
diff changeset
    53
      val entries = entries_unsorted.sortBy(_._1)
ff7d48e776ab properly sort entries;
Fabian Huch <huch@in.tum.de>
parents: 79040
diff changeset
    54
79036
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    55
      def sorted_prefix[A](xs: List[A], f: A => Long): List[A] =
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    56
        xs match {
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    57
          case x1 :: x2 :: xs =>
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    58
            if (f(x1) <= f(x2)) x1 :: sorted_prefix(x2 :: xs, f) else x1 :: Nil
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    59
          case xs => xs
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    60
        }
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    61
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    62
      def linear(p0: (Int, Time), p1: (Int, Time)): Time = {
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    63
        val a = (p1._2 - p0._2).scale(1.0 / (p1._1 - p0._1))
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    64
        val b = p0._2 - a.scale(p0._1)
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    65
        Time.ms((a.scale(threads) + b).ms max 0)
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    66
      }
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    67
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    68
      val mono_prefix = sorted_prefix(entries, e => -e._2.ms)
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    69
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    70
      val is_mono = entries == mono_prefix
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    71
      val in_prefix = mono_prefix.length > 1 && threads <= mono_prefix.last._1
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    72
      val in_inflection =
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    73
        !is_mono && mono_prefix.length > 1 && threads < entries.drop(mono_prefix.length).head._1
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    74
      if (is_mono || in_prefix || in_inflection) {
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    75
        // Model with Amdahl's law
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    76
        val t_p =
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    77
          Timing_Data.median_time(for {
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    78
            (n, t0) <- mono_prefix
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    79
            (m, t1) <- mono_prefix
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    80
            if m != n
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    81
          } yield (t0 - t1).scale(n.toDouble * m / (m - n)))
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    82
        val t_c =
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    83
          Timing_Data.median_time(for ((n, t) <- mono_prefix) yield t - t_p.scale(1.0 / n))
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    84
79086
59d5d1e26393 lower bound for approximated times;
Fabian Huch <huch@in.tum.de>
parents: 79085
diff changeset
    85
        def model(threads: Int): Time = Time.ms((t_c + t_p.scale(1.0 / threads)).ms max 0)
79036
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    86
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    87
        if (is_mono || in_prefix) model(threads)
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    88
        else {
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    89
          val post_inflection = entries.drop(mono_prefix.length).head
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    90
          val inflection_threads = inflection_point(mono_prefix.last._1, post_inflection._1)
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    91
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    92
          if (threads <= inflection_threads) model(threads)
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    93
          else linear((inflection_threads, model(inflection_threads)), post_inflection)
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    94
        }
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    95
      } else {
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    96
        // Piecewise linear
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
    97
        val (p0, p1) =
79042
1a9f3806987d proper split;
Fabian Huch <huch@in.tum.de>
parents: 79041
diff changeset
    98
          if (entries.head._1 < threads && threads < entries.last._1) {
1a9f3806987d proper split;
Fabian Huch <huch@in.tum.de>
parents: 79041
diff changeset
    99
            val split = entries.partition(_._1 < threads)
79036
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
   100
            (split._1.last, split._2.head)
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
   101
          } else {
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
   102
            val piece = if (threads < entries.head._1) entries.take(2) else entries.takeRight(2)
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
   103
            (piece.head, piece.last)
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
   104
          }
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
   105
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
   106
        linear(p0, p1)
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
   107
      }
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
   108
    }
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
   109
79037
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   110
    private def unify_hosts(job_name: String, on_host: String): List[(Int, Time)] = {
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   111
      def unify(hostname: String, data: Timing_Entries) =
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   112
        data.mean_time.scale(hostname_factor(hostname, on_host))
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   113
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   114
      for {
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   115
        data <- data.by_job.get(job_name).toList
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   116
        (threads, data) <- data.by_threads
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   117
        entries = data.by_hostname.toList.map(unify)
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   118
      } yield threads -> Timing_Data.median_time(entries)
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   119
    }
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   120
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   121
    def estimate_threads(job_name: String, hostname: String, threads: Int): Option[Time] = {
79087
3620010c410a use cpu time for approximation;
Fabian Huch <huch@in.tum.de>
parents: 79086
diff changeset
   122
      def try_approximate(data: Timing_Entries): Option[Time] = {
3620010c410a use cpu time for approximation;
Fabian Huch <huch@in.tum.de>
parents: 79086
diff changeset
   123
        val entries =
3620010c410a use cpu time for approximation;
Fabian Huch <huch@in.tum.de>
parents: 79086
diff changeset
   124
          data.by_threads.toList match {
3620010c410a use cpu time for approximation;
Fabian Huch <huch@in.tum.de>
parents: 79086
diff changeset
   125
            case List((i, Timing_Entries(List(entry)))) if i != 1 =>
3620010c410a use cpu time for approximation;
Fabian Huch <huch@in.tum.de>
parents: 79086
diff changeset
   126
              (i, data.mean_time) :: entry.proper_cpu.map(1 -> _).toList
3620010c410a use cpu time for approximation;
Fabian Huch <huch@in.tum.de>
parents: 79086
diff changeset
   127
            case entries => entries.map((threads, data) => threads -> data.mean_time)
3620010c410a use cpu time for approximation;
Fabian Huch <huch@in.tum.de>
parents: 79086
diff changeset
   128
          }
3620010c410a use cpu time for approximation;
Fabian Huch <huch@in.tum.de>
parents: 79086
diff changeset
   129
        if (entries.size < 2) None else Some(approximate_threads(entries, threads))
3620010c410a use cpu time for approximation;
Fabian Huch <huch@in.tum.de>
parents: 79086
diff changeset
   130
      }
3620010c410a use cpu time for approximation;
Fabian Huch <huch@in.tum.de>
parents: 79086
diff changeset
   131
79037
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   132
      for {
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   133
        data <- data.by_job.get(job_name)
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   134
        data <- data.by_hostname.get(hostname)
79087
3620010c410a use cpu time for approximation;
Fabian Huch <huch@in.tum.de>
parents: 79086
diff changeset
   135
        time <- data.by_threads.get(threads).map(_.mean_time).orElse(try_approximate(data))
79037
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   136
      } yield time
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   137
    }
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   138
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   139
    def global_threads_factor(from: Int, to: Int): Double = {
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   140
      def median(xs: Iterable[Double]): Double = xs.toList.sorted.apply(xs.size / 2)
79036
be42ba4b4672 split actual approximation from data handling;
Fabian Huch <huch@in.tum.de>
parents: 79035
diff changeset
   141
79037
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   142
      val estimates =
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   143
        for {
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   144
          (hostname, data) <- data.by_hostname
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   145
          job_name <- data.by_job.keys
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   146
          from_time <- estimate_threads(job_name, hostname, from)
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   147
          to_time <- estimate_threads(job_name, hostname, to)
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   148
        } yield from_time.ms.toDouble / to_time.ms
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   149
79037
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   150
      if (estimates.nonEmpty) median(estimates)
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   151
      else {
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   152
        // unify hosts
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   153
        val estimates =
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   154
          for {
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   155
            (job_name, data) <- data.by_job
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   156
            hostname = data.by_hostname.keys.head
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   157
            entries = unify_hosts(job_name, hostname)
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   158
            if entries.length > 1
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   159
          } yield
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   160
            approximate_threads(entries, from).ms.toDouble / approximate_threads(entries, to).ms
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   161
79037
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   162
        if (estimates.nonEmpty) median(estimates)
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   163
        else from.toDouble / to.toDouble
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   164
      }
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   165
    }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   166
79026
6585acdd6505 clarified time estimation: does not use config;
Fabian Huch <huch@in.tum.de>
parents: 79025
diff changeset
   167
    def estimate(job_name: String, hostname: String, threads: Int): Time =
79035
6beb60b508e6 clarified timing data vs. timing entries: full top-level data view vs. dynamic partial data;
Fabian Huch <huch@in.tum.de>
parents: 79034
diff changeset
   168
      data.by_job.get(job_name) match {
79038
cd7c1acc9cf2 better estimation for unknown jobs;
Fabian Huch <huch@in.tum.de>
parents: 79037
diff changeset
   169
        case None =>
cd7c1acc9cf2 better estimation for unknown jobs;
Fabian Huch <huch@in.tum.de>
parents: 79037
diff changeset
   170
          // no data for job, take average of other jobs for given threads
cd7c1acc9cf2 better estimation for unknown jobs;
Fabian Huch <huch@in.tum.de>
parents: 79037
diff changeset
   171
          val job_estimates = data.by_job.keys.flatMap(estimate_threads(_, hostname, threads))
cd7c1acc9cf2 better estimation for unknown jobs;
Fabian Huch <huch@in.tum.de>
parents: 79037
diff changeset
   172
          if (job_estimates.nonEmpty) Timing_Data.mean_time(job_estimates)
cd7c1acc9cf2 better estimation for unknown jobs;
Fabian Huch <huch@in.tum.de>
parents: 79037
diff changeset
   173
          else {
cd7c1acc9cf2 better estimation for unknown jobs;
Fabian Huch <huch@in.tum.de>
parents: 79037
diff changeset
   174
            // no other job to estimate from, use global curve to approximate any other job
cd7c1acc9cf2 better estimation for unknown jobs;
Fabian Huch <huch@in.tum.de>
parents: 79037
diff changeset
   175
            val (threads1, data1) = data.by_threads.head
cd7c1acc9cf2 better estimation for unknown jobs;
Fabian Huch <huch@in.tum.de>
parents: 79037
diff changeset
   176
            data1.mean_time.scale(global_threads_factor(threads1, threads))
cd7c1acc9cf2 better estimation for unknown jobs;
Fabian Huch <huch@in.tum.de>
parents: 79037
diff changeset
   177
          }
cd7c1acc9cf2 better estimation for unknown jobs;
Fabian Huch <huch@in.tum.de>
parents: 79037
diff changeset
   178
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   179
        case Some(data) =>
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   180
          data.by_threads.get(threads) match {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   181
            case None => // interpolate threads
79037
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   182
              estimate_threads(job_name, hostname, threads).getOrElse {
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   183
                // per machine, try to approximate config for threads
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   184
                val approximated =
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   185
                  for {
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   186
                    hostname1 <- data.by_hostname.keys
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   187
                    estimate <- estimate_threads(job_name, hostname1, threads)
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   188
                    factor = hostname_factor(hostname1, hostname)
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   189
                  } yield estimate.scale(factor)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   190
79037
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   191
                if (approximated.nonEmpty) Timing_Data.mean_time(approximated)
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   192
                else {
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   193
                  // no single machine where config can be approximated, unify data points
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   194
                  val unified_entries = unify_hosts(job_name, hostname)
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   195
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   196
                  if (unified_entries.length > 1) approximate_threads(unified_entries, threads)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   197
                  else {
79037
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   198
                    // only single data point, use global curve to approximate
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   199
                    val (job_threads, job_time) = unified_entries.head
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   200
                    job_time.scale(global_threads_factor(job_threads, threads))
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   201
                  }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   202
                }
79037
1b3a6cc4a2bf clarified and tuned timing estimation;
Fabian Huch <huch@in.tum.de>
parents: 79036
diff changeset
   203
              }
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   204
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   205
            case Some(data) => // time for job/thread exists, interpolate machine
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   206
              data.by_hostname.get(hostname).map(_.mean_time).getOrElse {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   207
                Timing_Data.median_time(
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   208
                  data.by_hostname.toList.map((hostname1, data) =>
78888
95bbf9a576b3 prefer Time.scale(), following Isabelle/ML;
wenzelm
parents: 78884
diff changeset
   209
                    data.mean_time.scale(hostname_factor(hostname1, hostname))))
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   210
              }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   211
          }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   212
      }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   213
  }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   214
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   215
  object Timing_Data {
79085
cf51ccfd3e39 use full timing information in build schedule;
Fabian Huch <huch@in.tum.de>
parents: 79084
diff changeset
   216
    def median_timing(obs: List[Timing]): Timing = obs.sortBy(_.elapsed.ms).apply(obs.length / 2)
79039
Fabian Huch <huch@in.tum.de>
parents: 79038
diff changeset
   217
    def median_time(obs: List[Time]): Time = obs.sortBy(_.ms).apply(obs.length / 2)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   218
    def mean_time(obs: Iterable[Time]): Time = Time.ms(obs.map(_.ms).sum / obs.size)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   219
79085
cf51ccfd3e39 use full timing information in build schedule;
Fabian Huch <huch@in.tum.de>
parents: 79084
diff changeset
   220
    private def dummy_entries(host: Host, host_factor: Double) = {
cf51ccfd3e39 use full timing information in build schedule;
Fabian Huch <huch@in.tum.de>
parents: 79084
diff changeset
   221
      val baseline = Time.minutes(5).scale(host_factor)
cf51ccfd3e39 use full timing information in build schedule;
Fabian Huch <huch@in.tum.de>
parents: 79084
diff changeset
   222
      val gc = Time.seconds(10).scale(host_factor)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   223
      List(
79103
883f61f0beda clarified build schedule host: more operations;
Fabian Huch <huch@in.tum.de>
parents: 79102
diff changeset
   224
        Timing_Entry("dummy", host.name, 1, Timing(baseline, baseline, gc)),
883f61f0beda clarified build schedule host: more operations;
Fabian Huch <huch@in.tum.de>
parents: 79102
diff changeset
   225
        Timing_Entry("dummy", host.name, 8, Timing(baseline.scale(0.2), baseline, gc)))
79085
cf51ccfd3e39 use full timing information in build schedule;
Fabian Huch <huch@in.tum.de>
parents: 79084
diff changeset
   226
    }
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   227
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   228
    def make(
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   229
      host_infos: Host_Infos,
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   230
      build_history: List[(Build_Log.Meta_Info, Build_Log.Build_Info)],
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   231
    ): Timing_Data = {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   232
      val hosts = host_infos.hosts
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   233
      val measurements =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   234
        for {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   235
          (meta_info, build_info) <- build_history
79083
2d18d481c115 filter hosts properly;
Fabian Huch <huch@in.tum.de>
parents: 79073
diff changeset
   236
          build_host = meta_info.get(Build_Log.Prop.build_host)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   237
          (job_name, session_info) <- build_info.sessions.toList
78933
4f940d7293ea use only finished sessions in timing data;
Fabian Huch <huch@in.tum.de>
parents: 78932
diff changeset
   238
          if build_info.finished_sessions.contains(job_name)
79083
2d18d481c115 filter hosts properly;
Fabian Huch <huch@in.tum.de>
parents: 79073
diff changeset
   239
          hostname <- session_info.hostname.orElse(build_host).toList
2d18d481c115 filter hosts properly;
Fabian Huch <huch@in.tum.de>
parents: 79073
diff changeset
   240
          host <- hosts.find(_.info.hostname == hostname).toList
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   241
          threads = session_info.threads.getOrElse(host.info.num_cpus)
79085
cf51ccfd3e39 use full timing information in build schedule;
Fabian Huch <huch@in.tum.de>
parents: 79084
diff changeset
   242
        } yield (job_name, hostname, threads) -> session_info.timing
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   243
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   244
      val entries =
78934
5553a86a1091 proper dummy timing entries;
Fabian Huch <huch@in.tum.de>
parents: 78933
diff changeset
   245
        if (measurements.isEmpty) {
79084
dd689c4ab688 consistent hosts ordering;
Fabian Huch <huch@in.tum.de>
parents: 79083
diff changeset
   246
          val default_host = host_infos.hosts.sorted(host_infos.host_speeds).last
78934
5553a86a1091 proper dummy timing entries;
Fabian Huch <huch@in.tum.de>
parents: 78933
diff changeset
   247
          host_infos.hosts.flatMap(host =>
5553a86a1091 proper dummy timing entries;
Fabian Huch <huch@in.tum.de>
parents: 78933
diff changeset
   248
            dummy_entries(host, host_infos.host_factor(default_host, host)))
5553a86a1091 proper dummy timing entries;
Fabian Huch <huch@in.tum.de>
parents: 78933
diff changeset
   249
        }
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   250
        else
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   251
          measurements.groupMap(_._1)(_._2).toList.map {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   252
            case ((job_name, hostname, threads), timings) =>
79085
cf51ccfd3e39 use full timing information in build schedule;
Fabian Huch <huch@in.tum.de>
parents: 79084
diff changeset
   253
              Timing_Entry(job_name, hostname, threads, median_timing(timings))
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   254
          }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   255
79035
6beb60b508e6 clarified timing data vs. timing entries: full top-level data view vs. dynamic partial data;
Fabian Huch <huch@in.tum.de>
parents: 79034
diff changeset
   256
      new Timing_Data(Timing_Entries(entries), host_infos)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   257
    }
79090
20be5b925720 clarified load vs. apply vs. make;
Fabian Huch <huch@in.tum.de>
parents: 79089
diff changeset
   258
20be5b925720 clarified load vs. apply vs. make;
Fabian Huch <huch@in.tum.de>
parents: 79089
diff changeset
   259
    def load(host_infos: Host_Infos, log_database: SQL.Database): Timing_Data = {
20be5b925720 clarified load vs. apply vs. make;
Fabian Huch <huch@in.tum.de>
parents: 79089
diff changeset
   260
      val build_history =
20be5b925720 clarified load vs. apply vs. make;
Fabian Huch <huch@in.tum.de>
parents: 79089
diff changeset
   261
        for {
20be5b925720 clarified load vs. apply vs. make;
Fabian Huch <huch@in.tum.de>
parents: 79089
diff changeset
   262
          log_name <- log_database.execute_query_statement(
20be5b925720 clarified load vs. apply vs. make;
Fabian Huch <huch@in.tum.de>
parents: 79089
diff changeset
   263
            Build_Log.private_data.meta_info_table.select(List(Build_Log.Column.log_name)),
20be5b925720 clarified load vs. apply vs. make;
Fabian Huch <huch@in.tum.de>
parents: 79089
diff changeset
   264
            List.from[String], res => res.string(Build_Log.Column.log_name))
20be5b925720 clarified load vs. apply vs. make;
Fabian Huch <huch@in.tum.de>
parents: 79089
diff changeset
   265
          meta_info <- Build_Log.private_data.read_meta_info(log_database, log_name)
20be5b925720 clarified load vs. apply vs. make;
Fabian Huch <huch@in.tum.de>
parents: 79089
diff changeset
   266
          build_info = Build_Log.private_data.read_build_info(log_database, log_name)
20be5b925720 clarified load vs. apply vs. make;
Fabian Huch <huch@in.tum.de>
parents: 79089
diff changeset
   267
        } yield (meta_info, build_info)
20be5b925720 clarified load vs. apply vs. make;
Fabian Huch <huch@in.tum.de>
parents: 79089
diff changeset
   268
20be5b925720 clarified load vs. apply vs. make;
Fabian Huch <huch@in.tum.de>
parents: 79089
diff changeset
   269
      make(host_infos, build_history)
20be5b925720 clarified load vs. apply vs. make;
Fabian Huch <huch@in.tum.de>
parents: 79089
diff changeset
   270
    }
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   271
  }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   272
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   273
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   274
  /* host information */
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   275
79103
883f61f0beda clarified build schedule host: more operations;
Fabian Huch <huch@in.tum.de>
parents: 79102
diff changeset
   276
  case class Host(info: isabelle.Host.Info, build: Build_Cluster.Host) {
883f61f0beda clarified build schedule host: more operations;
Fabian Huch <huch@in.tum.de>
parents: 79102
diff changeset
   277
    def name: String = info.hostname
883f61f0beda clarified build schedule host: more operations;
Fabian Huch <huch@in.tum.de>
parents: 79102
diff changeset
   278
    def num_cpus: Int = info.num_cpus
883f61f0beda clarified build schedule host: more operations;
Fabian Huch <huch@in.tum.de>
parents: 79102
diff changeset
   279
  }
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   280
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   281
  object Host_Infos {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   282
    def dummy: Host_Infos =
78846
966aa081929f tuned imports;
wenzelm
parents: 78845
diff changeset
   283
      new Host_Infos(
966aa081929f tuned imports;
wenzelm
parents: 78845
diff changeset
   284
        List(Host(isabelle.Host.Info("dummy", Nil, 8, Some(1.0)), Build_Cluster.Host("dummy"))))
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   285
79090
20be5b925720 clarified load vs. apply vs. make;
Fabian Huch <huch@in.tum.de>
parents: 79089
diff changeset
   286
    def load(build_hosts: List[Build_Cluster.Host], db: SQL.Database): Host_Infos = {
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   287
      def get_host(build_host: Build_Cluster.Host): Host = {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   288
        val info =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   289
          isabelle.Host.read_info(db, build_host.name).getOrElse(
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   290
            error("No benchmark for " + quote(build_host.name)))
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   291
        Host(info, build_host)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   292
      }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   293
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   294
      new Host_Infos(build_hosts.map(get_host))
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   295
    }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   296
  }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   297
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   298
  class Host_Infos private(val hosts: List[Host]) {
79040
Fabian Huch <huch@in.tum.de>
parents: 79039
diff changeset
   299
    require(hosts.nonEmpty)
Fabian Huch <huch@in.tum.de>
parents: 79039
diff changeset
   300
79103
883f61f0beda clarified build schedule host: more operations;
Fabian Huch <huch@in.tum.de>
parents: 79102
diff changeset
   301
    private val by_hostname = hosts.map(host => host.name -> host).toMap
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   302
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   303
    def host_factor(from: Host, to: Host): Double =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   304
      from.info.benchmark_score.get / to.info.benchmark_score.get
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   305
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   306
    val host_speeds: Ordering[Host] =
79084
dd689c4ab688 consistent hosts ordering;
Fabian Huch <huch@in.tum.de>
parents: 79083
diff changeset
   307
      Ordering.fromLessThan((host1, host2) => host_factor(host1, host2) < 1)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   308
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   309
    def the_host(hostname: String): Host =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   310
      by_hostname.getOrElse(hostname, error("Unknown host " + quote(hostname)))
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   311
    def the_host(node_info: Node_Info): Host = the_host(node_info.hostname)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   312
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   313
    def num_threads(node_info: Node_Info): Int =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   314
      if (node_info.rel_cpus.nonEmpty) node_info.rel_cpus.length
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   315
      else the_host(node_info).info.num_cpus
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   316
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   317
    def available(state: Build_Process.State): Resources = {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   318
      val allocated =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   319
        state.running.values.map(_.node_info).groupMapReduce(the_host)(List(_))(_ ::: _)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   320
      Resources(this, allocated)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   321
    }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   322
  }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   323
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   324
79029
Fabian Huch <huch@in.tum.de>
parents: 79028
diff changeset
   325
  /* offline tracking of job configurations and resource allocations */
Fabian Huch <huch@in.tum.de>
parents: 79028
diff changeset
   326
Fabian Huch <huch@in.tum.de>
parents: 79028
diff changeset
   327
  object Config {
Fabian Huch <huch@in.tum.de>
parents: 79028
diff changeset
   328
    def from_job(job: Build_Process.Job): Config = Config(job.name, job.node_info)
Fabian Huch <huch@in.tum.de>
parents: 79028
diff changeset
   329
  }
Fabian Huch <huch@in.tum.de>
parents: 79028
diff changeset
   330
Fabian Huch <huch@in.tum.de>
parents: 79028
diff changeset
   331
  case class Config(job_name: String, node_info: Node_Info) {
Fabian Huch <huch@in.tum.de>
parents: 79028
diff changeset
   332
    def job_of(start_time: Time): Build_Process.Job =
Fabian Huch <huch@in.tum.de>
parents: 79028
diff changeset
   333
      Build_Process.Job(job_name, "", "", node_info, Date(start_time), None)
Fabian Huch <huch@in.tum.de>
parents: 79028
diff changeset
   334
  }
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   335
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   336
  case class Resources(
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   337
    host_infos: Host_Infos,
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   338
    allocated_nodes: Map[Host, List[Node_Info]]
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   339
  ) {
79106
91955d607aad proper unused nodes;
Fabian Huch <huch@in.tum.de>
parents: 79105
diff changeset
   340
    def unused_nodes(host: Host, threads: Int): List[Node_Info] =
91955d607aad proper unused nodes;
Fabian Huch <huch@in.tum.de>
parents: 79105
diff changeset
   341
      if (!available(host, threads)) Nil
91955d607aad proper unused nodes;
Fabian Huch <huch@in.tum.de>
parents: 79105
diff changeset
   342
      else {
91955d607aad proper unused nodes;
Fabian Huch <huch@in.tum.de>
parents: 79105
diff changeset
   343
        val node = next_node(host, threads)
91955d607aad proper unused nodes;
Fabian Huch <huch@in.tum.de>
parents: 79105
diff changeset
   344
        node :: allocate(node).unused_nodes(host, threads)
91955d607aad proper unused nodes;
Fabian Huch <huch@in.tum.de>
parents: 79105
diff changeset
   345
      }
91955d607aad proper unused nodes;
Fabian Huch <huch@in.tum.de>
parents: 79105
diff changeset
   346
91955d607aad proper unused nodes;
Fabian Huch <huch@in.tum.de>
parents: 79105
diff changeset
   347
    def unused_nodes(threads: Int): List[Node_Info] =
91955d607aad proper unused nodes;
Fabian Huch <huch@in.tum.de>
parents: 79105
diff changeset
   348
      host_infos.hosts.flatMap(unused_nodes(_, threads))
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   349
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   350
    def allocated(host: Host): List[Node_Info] = allocated_nodes.getOrElse(host, Nil)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   351
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   352
    def allocate(node: Node_Info): Resources = {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   353
      val host = host_infos.the_host(node)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   354
      copy(allocated_nodes = allocated_nodes + (host -> (node :: allocated(host))))
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   355
    }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   356
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   357
    def try_allocate_tasks(
78971
f930d24f1548 scheduled build: allocate cpus more aggressively, to avoid idle threads;
Fabian Huch <huch@in.tum.de>
parents: 78970
diff changeset
   358
      hosts: List[(Host, Int)],
f930d24f1548 scheduled build: allocate cpus more aggressively, to avoid idle threads;
Fabian Huch <huch@in.tum.de>
parents: 78970
diff changeset
   359
      tasks: List[(Build_Process.Task, Int, Int)],
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   360
    ): (List[Config], Resources) =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   361
      tasks match {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   362
        case Nil => (Nil, this)
78971
f930d24f1548 scheduled build: allocate cpus more aggressively, to avoid idle threads;
Fabian Huch <huch@in.tum.de>
parents: 78970
diff changeset
   363
        case (task, min_threads, max_threads) :: tasks =>
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   364
          val (config, resources) =
78971
f930d24f1548 scheduled build: allocate cpus more aggressively, to avoid idle threads;
Fabian Huch <huch@in.tum.de>
parents: 78970
diff changeset
   365
            hosts.find((host, _) => available(host, min_threads)) match {
f930d24f1548 scheduled build: allocate cpus more aggressively, to avoid idle threads;
Fabian Huch <huch@in.tum.de>
parents: 78970
diff changeset
   366
              case Some((host, host_max_threads)) =>
f930d24f1548 scheduled build: allocate cpus more aggressively, to avoid idle threads;
Fabian Huch <huch@in.tum.de>
parents: 78970
diff changeset
   367
                val free_threads = host.info.num_cpus - ((host.build.jobs - 1) * host_max_threads)
f930d24f1548 scheduled build: allocate cpus more aggressively, to avoid idle threads;
Fabian Huch <huch@in.tum.de>
parents: 78970
diff changeset
   368
                val node_info = next_node(host, (min_threads max free_threads) min max_threads)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   369
                (Some(Config(task.name, node_info)), allocate(node_info))
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   370
              case None => (None, this)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   371
            }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   372
          val (configs, resources1) = resources.try_allocate_tasks(hosts, tasks)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   373
          (configs ++ config, resources1)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   374
      }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   375
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   376
    def next_node(host: Host, threads: Int): Node_Info = {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   377
      val numa_node_num_cpus = host.info.num_cpus / (host.info.numa_nodes.length max 1)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   378
      def explicit_cpus(node_info: Node_Info): List[Int] =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   379
        if (node_info.rel_cpus.nonEmpty) node_info.rel_cpus else (0 until numa_node_num_cpus).toList
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   380
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   381
      val used_nodes = allocated(host).groupMapReduce(_.numa_node)(explicit_cpus)(_ ::: _)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   382
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   383
      val available_nodes = host.info.numa_nodes
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   384
      val numa_node =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   385
        if (!host.build.numa) None
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   386
        else available_nodes.sortBy(n => used_nodes.getOrElse(Some(n), Nil).length).headOption
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   387
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   388
      val used_cpus = used_nodes.getOrElse(numa_node, Nil).toSet
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   389
      val available_cpus = (0 until numa_node_num_cpus).filterNot(used_cpus.contains).toList
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   390
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   391
      val rel_cpus = if (available_cpus.length >= threads) available_cpus.take(threads) else Nil
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   392
79103
883f61f0beda clarified build schedule host: more operations;
Fabian Huch <huch@in.tum.de>
parents: 79102
diff changeset
   393
      Node_Info(host.name, numa_node, rel_cpus)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   394
    }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   395
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   396
    def available(host: Host, threads: Int): Boolean = {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   397
      val used = allocated(host)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   398
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   399
      if (used.length >= host.build.jobs) false
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   400
      else {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   401
        if (host.info.numa_nodes.length <= 1)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   402
          used.map(host_infos.num_threads).sum + threads <= host.info.num_cpus
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   403
        else {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   404
          def node_threads(n: Int): Int =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   405
            used.filter(_.numa_node.contains(n)).map(host_infos.num_threads).sum
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   406
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   407
          host.info.numa_nodes.exists(
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   408
            node_threads(_) + threads <= host.info.num_cpus / host.info.numa_nodes.length)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   409
        }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   410
      }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   411
    }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   412
  }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   413
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   414
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   415
  /* schedule generation */
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   416
79073
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   417
  object Schedule {
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   418
    case class Node(job_name: String, node_info: Node_Info, start: Date, duration: Time) {
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   419
      def end: Date = Date(start.time + duration)
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   420
    }
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   421
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   422
    type Graph = isabelle.Graph[String, Node]
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   423
  }
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   424
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   425
  case class Schedule(start: Date, graph: Schedule.Graph) {
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   426
    def end: Date =
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   427
      if (graph.is_empty) start
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   428
      else graph.maximals.map(graph.get_node).map(_.end).maxBy(_.unix_epoch)
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   429
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   430
    def duration: Time = end.time - start.time
79105
6e92475ff925 clarified schedule message;
Fabian Huch <huch@in.tum.de>
parents: 79104
diff changeset
   431
    def message: String = "Estimated " + duration.message_hms + " build time"
79073
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   432
  }
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   433
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   434
  case class State(build_state: Build_Process.State, current_time: Time, finished: Schedule) {
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   435
    def start(config: Config): State =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   436
      copy(build_state =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   437
        build_state.copy(running = build_state.running +
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   438
          (config.job_name -> config.job_of(current_time))))
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   439
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   440
    def step(timing_data: Timing_Data): State = {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   441
      val remaining =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   442
        build_state.running.values.toList.map { job =>
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   443
          val elapsed = current_time - job.start_date.time
79026
6585acdd6505 clarified time estimation: does not use config;
Fabian Huch <huch@in.tum.de>
parents: 79025
diff changeset
   444
          val threads = timing_data.host_infos.num_threads(job.node_info)
6585acdd6505 clarified time estimation: does not use config;
Fabian Huch <huch@in.tum.de>
parents: 79025
diff changeset
   445
          val predicted = timing_data.estimate(job.name, job.node_info.hostname, threads)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   446
          val remaining = if (elapsed > predicted) Time.zero else predicted - elapsed
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   447
          job -> remaining
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   448
        }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   449
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   450
      if (remaining.isEmpty) error("Schedule step without running sessions")
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   451
      else {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   452
        val (job, elapsed) = remaining.minBy(_._2.ms)
79073
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   453
        val now = current_time + elapsed
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   454
        val node = Schedule.Node(job.name, job.node_info, job.start_date, now - job.start_date.time)
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   455
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   456
        val preds =
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   457
          build_state.sessions.graph.imm_preds(job.name).filter(finished.graph.defined)
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   458
        val graph =
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   459
          preds.foldLeft(finished.graph.new_node(job.name, node))(_.add_edge(_, job.name))
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   460
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   461
        val build_state1 = build_state.remove_running(job.name).remove_pending(job.name)
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   462
        State(build_state1, now, finished.copy(graph = graph))
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   463
      }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   464
    }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   465
79073
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   466
    def is_finished: Boolean = build_state.pending.isEmpty && build_state.running.isEmpty
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   467
  }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   468
78932
Fabian Huch <huch@in.tum.de>
parents: 78931
diff changeset
   469
  trait Scheduler {
78928
6c2c60b852e0 move timing data into scheduler for more efficient heuristics (e.g., with pre-calculated values);
Fabian Huch <huch@in.tum.de>
parents: 78888
diff changeset
   470
    def next(state: Build_Process.State): List[Config]
79073
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   471
    def build_schedule(build_state: Build_Process.State): Schedule
78931
26841d3c568c performance tuning for build schedule: explicit schedule generation, without mixing heuristics;
Fabian Huch <huch@in.tum.de>
parents: 78930
diff changeset
   472
  }
26841d3c568c performance tuning for build schedule: explicit schedule generation, without mixing heuristics;
Fabian Huch <huch@in.tum.de>
parents: 78930
diff changeset
   473
79102
4d5f878665a3 clarified path heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79101
diff changeset
   474
  abstract class Heuristic(timing_data: Timing_Data) extends Scheduler {
79019
4df053d29215 introduced path heuristic abstraction;
Fabian Huch <huch@in.tum.de>
parents: 78976
diff changeset
   475
    val host_infos = timing_data.host_infos
79028
6bada416ba55 clarified timing data operations: proper estimation (instead of known points);
Fabian Huch <huch@in.tum.de>
parents: 79027
diff changeset
   476
    val ordered_hosts = host_infos.hosts.sorted(host_infos.host_speeds)
6bada416ba55 clarified timing data operations: proper estimation (instead of known points);
Fabian Huch <huch@in.tum.de>
parents: 79027
diff changeset
   477
79073
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   478
    def build_schedule(build_state: Build_Process.State): Schedule = {
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   479
      @tailrec
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   480
      def simulate(state: State): State =
79073
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   481
        if (state.is_finished) state
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   482
        else {
78932
Fabian Huch <huch@in.tum.de>
parents: 78931
diff changeset
   483
          val state1 = next(state.build_state).foldLeft(state)(_.start(_)).step(timing_data)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   484
          simulate(state1)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   485
        }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   486
79073
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   487
      val start = Date.now()
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   488
      val end_state = simulate(State(build_state, start.time, Schedule(start, Graph.empty)))
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   489
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   490
      end_state.finished
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   491
    }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   492
  }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   493
79107
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   494
  class Default_Heuristic(timing_data: Timing_Data, options: Options)
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   495
    extends Heuristic(timing_data) {
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   496
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   497
    def host_threads(host: Host): Int = {
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   498
      val m = (options ++ host.build.options).int("threads")
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   499
      if (m > 0) m else (host.num_cpus max 1) min 8
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   500
    }
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   501
    
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   502
    def next_jobs(resources: Resources, sorted_jobs: List[String], host: Host): List[Config] =
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   503
      sorted_jobs.zip(resources.unused_nodes(host, host_threads(host))).map(Config(_, _))
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   504
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   505
    def next(state: Build_Process.State): List[Config] = {
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   506
      val sorted_jobs = state.next_ready.sortBy(_.name)(state.sessions.ordering).map(_.name)
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   507
      val resources = host_infos.available(state)
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   508
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   509
      host_infos.hosts.foldLeft((sorted_jobs, List.empty[Config])) {
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   510
        case ((jobs, res), host) =>
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   511
          val configs = next_jobs(resources, jobs, host)
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   512
          val config_jobs = configs.map(_.job_name).toSet
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   513
          (jobs.filterNot(config_jobs.contains), configs ::: res)
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   514
      }._2
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   515
    }
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   516
  }
f5a2f956b531 add heuristic for non-scheduled (standard) build behaviour;
Fabian Huch <huch@in.tum.de>
parents: 79106
diff changeset
   517
78931
26841d3c568c performance tuning for build schedule: explicit schedule generation, without mixing heuristics;
Fabian Huch <huch@in.tum.de>
parents: 78930
diff changeset
   518
  class Meta_Heuristic(heuristics: List[Heuristic]) extends Scheduler {
26841d3c568c performance tuning for build schedule: explicit schedule generation, without mixing heuristics;
Fabian Huch <huch@in.tum.de>
parents: 78930
diff changeset
   519
    require(heuristics.nonEmpty)
26841d3c568c performance tuning for build schedule: explicit schedule generation, without mixing heuristics;
Fabian Huch <huch@in.tum.de>
parents: 78930
diff changeset
   520
79073
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   521
    def best_result(state: Build_Process.State): (Heuristic, Schedule) =
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   522
      heuristics.map(heuristic =>
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   523
        heuristic -> heuristic.build_schedule(state)).minBy(_._2.duration.ms)
78931
26841d3c568c performance tuning for build schedule: explicit schedule generation, without mixing heuristics;
Fabian Huch <huch@in.tum.de>
parents: 78930
diff changeset
   524
26841d3c568c performance tuning for build schedule: explicit schedule generation, without mixing heuristics;
Fabian Huch <huch@in.tum.de>
parents: 78930
diff changeset
   525
    def next(state: Build_Process.State): List[Config] = best_result(state)._1.next(state)
26841d3c568c performance tuning for build schedule: explicit schedule generation, without mixing heuristics;
Fabian Huch <huch@in.tum.de>
parents: 78930
diff changeset
   526
79073
b3fee0dafd72 generated build schedule explicitly (e.g., for further analysis);
Fabian Huch <huch@in.tum.de>
parents: 79064
diff changeset
   527
    def build_schedule(state: Build_Process.State): Schedule = best_result(state)._2
78931
26841d3c568c performance tuning for build schedule: explicit schedule generation, without mixing heuristics;
Fabian Huch <huch@in.tum.de>
parents: 78930
diff changeset
   528
  }
26841d3c568c performance tuning for build schedule: explicit schedule generation, without mixing heuristics;
Fabian Huch <huch@in.tum.de>
parents: 78930
diff changeset
   529
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   530
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   531
  /* heuristics */
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   532
79027
d08fb157e300 use proper max threads (limited by available hardware) in heuristics;
Fabian Huch <huch@in.tum.de>
parents: 79026
diff changeset
   533
  abstract class Path_Heuristic(
d08fb157e300 use proper max threads (limited by available hardware) in heuristics;
Fabian Huch <huch@in.tum.de>
parents: 79026
diff changeset
   534
    timing_data: Timing_Data,
d08fb157e300 use proper max threads (limited by available hardware) in heuristics;
Fabian Huch <huch@in.tum.de>
parents: 79026
diff changeset
   535
    sessions_structure: Sessions.Structure,
d08fb157e300 use proper max threads (limited by available hardware) in heuristics;
Fabian Huch <huch@in.tum.de>
parents: 79026
diff changeset
   536
    max_threads_limit: Int
79102
4d5f878665a3 clarified path heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79101
diff changeset
   537
  ) extends Heuristic(timing_data) {
78929
df323f23dfde performance tuning for timing heuristic: pre-calculate graph operations;
Fabian Huch <huch@in.tum.de>
parents: 78928
diff changeset
   538
    /* pre-computed properties for efficient heuristic */
df323f23dfde performance tuning for timing heuristic: pre-calculate graph operations;
Fabian Huch <huch@in.tum.de>
parents: 78928
diff changeset
   539
79102
4d5f878665a3 clarified path heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79101
diff changeset
   540
    val max_threads = host_infos.hosts.map(_.info.num_cpus).max min max_threads_limit
4d5f878665a3 clarified path heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79101
diff changeset
   541
78929
df323f23dfde performance tuning for timing heuristic: pre-calculate graph operations;
Fabian Huch <huch@in.tum.de>
parents: 78928
diff changeset
   542
    type Node = String
df323f23dfde performance tuning for timing heuristic: pre-calculate graph operations;
Fabian Huch <huch@in.tum.de>
parents: 78928
diff changeset
   543
    val build_graph = sessions_structure.build_graph
79101
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   544
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   545
    val minimals = build_graph.minimals
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   546
    val maximals = build_graph.maximals
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   547
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   548
    def all_preds(node: Node): Set[Node] = build_graph.all_preds(List(node)).toSet
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   549
    val maximals_all_preds = maximals.map(node => node -> all_preds(node)).toMap
78929
df323f23dfde performance tuning for timing heuristic: pre-calculate graph operations;
Fabian Huch <huch@in.tum.de>
parents: 78928
diff changeset
   550
79102
4d5f878665a3 clarified path heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79101
diff changeset
   551
    def best_time(node: Node): Time = {
4d5f878665a3 clarified path heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79101
diff changeset
   552
      val host = ordered_hosts.last
4d5f878665a3 clarified path heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79101
diff changeset
   553
      val threads = timing_data.best_threads(node, max_threads) min host.info.num_cpus
79103
883f61f0beda clarified build schedule host: more operations;
Fabian Huch <huch@in.tum.de>
parents: 79102
diff changeset
   554
      timing_data.estimate(node, host.name, threads)
79102
4d5f878665a3 clarified path heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79101
diff changeset
   555
    }
79028
6bada416ba55 clarified timing data operations: proper estimation (instead of known points);
Fabian Huch <huch@in.tum.de>
parents: 79027
diff changeset
   556
    val best_times = build_graph.keys.map(node => node -> best_time(node)).toMap
78929
df323f23dfde performance tuning for timing heuristic: pre-calculate graph operations;
Fabian Huch <huch@in.tum.de>
parents: 78928
diff changeset
   557
79101
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   558
    val succs_max_time_ms = build_graph.node_height(best_times(_).ms)
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   559
    def max_time(node: Node): Time = Time.ms(succs_max_time_ms(node)) + best_times(node)
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   560
    def max_time(task: Build_Process.Task): Time = max_time(task.name)
78929
df323f23dfde performance tuning for timing heuristic: pre-calculate graph operations;
Fabian Huch <huch@in.tum.de>
parents: 78928
diff changeset
   561
79101
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   562
    def path_times(minimals: List[Node]): Map[Node, Time] = {
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   563
      def time_ms(node: Node): Long = best_times(node).ms
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   564
      val path_times_ms = build_graph.reachable_length(time_ms, build_graph.imm_succs, minimals)
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   565
      path_times_ms.view.mapValues(Time.ms).toMap
78929
df323f23dfde performance tuning for timing heuristic: pre-calculate graph operations;
Fabian Huch <huch@in.tum.de>
parents: 78928
diff changeset
   566
    }
df323f23dfde performance tuning for timing heuristic: pre-calculate graph operations;
Fabian Huch <huch@in.tum.de>
parents: 78928
diff changeset
   567
79101
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   568
    def path_max_times(minimals: List[Node]): Map[Node, Time] =
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   569
      path_times(minimals).toList.map((node, time) => node -> (time + max_time(node))).toMap
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   570
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   571
    def parallel_paths(minimals: List[Node], pred: Node => Boolean = _ => true): Int = {
78972
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   572
      def start(node: Node): (Node, Time) = node -> best_times(node)
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   573
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   574
      def pass_time(elapsed: Time)(node: Node, time: Time): (Node, Time) =
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   575
        node -> (time - elapsed)
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   576
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   577
      def parallel_paths(running: Map[Node, Time]): (Int, Map[Node, Time]) =
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   578
        if (running.isEmpty) (0, running)
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   579
        else {
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   580
          def get_next(node: Node): List[Node] =
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   581
            build_graph.imm_succs(node).filter(pred).filter(
79104
e7ab5f4ed401 proper parallel paths;
Fabian Huch <huch@in.tum.de>
parents: 79103
diff changeset
   582
              build_graph.imm_preds(_).intersect(running.keySet) == Set(node)).toList
78972
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   583
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   584
          val (next, elapsed) = running.minBy(_._2.ms)
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   585
          val (remaining, finished) =
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   586
            running.toList.map(pass_time(elapsed)).partition(_._2 > Time.zero)
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   587
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   588
          val running1 =
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   589
            remaining.map(pass_time(elapsed)).toMap ++
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   590
              finished.map(_._1).flatMap(get_next).map(start)
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   591
          val (res, running2) = parallel_paths(running1)
79104
e7ab5f4ed401 proper parallel paths;
Fabian Huch <huch@in.tum.de>
parents: 79103
diff changeset
   592
          (res max running.size, running2)
78972
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   593
        }
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   594
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   595
      parallel_paths(minimals.map(start).toMap)._1
7a39f151e9a7 proper parallel paths for timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 78971
diff changeset
   596
    }
79019
4df053d29215 introduced path heuristic abstraction;
Fabian Huch <huch@in.tum.de>
parents: 78976
diff changeset
   597
  }
78929
df323f23dfde performance tuning for timing heuristic: pre-calculate graph operations;
Fabian Huch <huch@in.tum.de>
parents: 78928
diff changeset
   598
79019
4df053d29215 introduced path heuristic abstraction;
Fabian Huch <huch@in.tum.de>
parents: 78976
diff changeset
   599
  class Timing_Heuristic(
4df053d29215 introduced path heuristic abstraction;
Fabian Huch <huch@in.tum.de>
parents: 78976
diff changeset
   600
    threshold: Time,
4df053d29215 introduced path heuristic abstraction;
Fabian Huch <huch@in.tum.de>
parents: 78976
diff changeset
   601
    timing_data: Timing_Data,
4df053d29215 introduced path heuristic abstraction;
Fabian Huch <huch@in.tum.de>
parents: 78976
diff changeset
   602
    sessions_structure: Sessions.Structure,
79027
d08fb157e300 use proper max threads (limited by available hardware) in heuristics;
Fabian Huch <huch@in.tum.de>
parents: 79026
diff changeset
   603
    max_threads_limit: Int = 8
d08fb157e300 use proper max threads (limited by available hardware) in heuristics;
Fabian Huch <huch@in.tum.de>
parents: 79026
diff changeset
   604
  ) extends Path_Heuristic(timing_data, sessions_structure, max_threads_limit) {
78929
df323f23dfde performance tuning for timing heuristic: pre-calculate graph operations;
Fabian Huch <huch@in.tum.de>
parents: 78928
diff changeset
   605
78928
6c2c60b852e0 move timing data into scheduler for more efficient heuristics (e.g., with pre-calculated values);
Fabian Huch <huch@in.tum.de>
parents: 78888
diff changeset
   606
    def next(state: Build_Process.State): List[Config] = {
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   607
      val resources = host_infos.available(state)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   608
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   609
      def best_threads(task: Build_Process.Task): Int =
79028
6bada416ba55 clarified timing data operations: proper estimation (instead of known points);
Fabian Huch <huch@in.tum.de>
parents: 79027
diff changeset
   610
        timing_data.best_threads(task.name, max_threads)
78971
f930d24f1548 scheduled build: allocate cpus more aggressively, to avoid idle threads;
Fabian Huch <huch@in.tum.de>
parents: 78970
diff changeset
   611
79028
6bada416ba55 clarified timing data operations: proper estimation (instead of known points);
Fabian Huch <huch@in.tum.de>
parents: 79027
diff changeset
   612
      val rev_ordered_hosts = ordered_hosts.reverse.map(_ -> max_threads)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   613
79021
1c91e884035d properly incorporate running tasks into timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79020
diff changeset
   614
      val resources0 = host_infos.available(state.copy(running = Map.empty))
79101
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   615
      val max_parallel = parallel_paths(state.ready.map(_.name))
79021
1c91e884035d properly incorporate running tasks into timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79020
diff changeset
   616
      val fully_parallelizable = max_parallel <= resources0.unused_nodes(max_threads).length
78973
d91e131840a0 timing heuristic: parallelize more aggressively to utilize hosts fully;
Fabian Huch <huch@in.tum.de>
parents: 78972
diff changeset
   617
79101
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   618
      val next_sorted = state.next_ready.sortBy(max_time(_).ms).reverse
79088
32e839bb622e tuned heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79087
diff changeset
   619
78973
d91e131840a0 timing heuristic: parallelize more aggressively to utilize hosts fully;
Fabian Huch <huch@in.tum.de>
parents: 78972
diff changeset
   620
      if (fully_parallelizable) {
79101
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   621
        val all_tasks = next_sorted.map(task => (task, best_threads(task), best_threads(task)))
79028
6bada416ba55 clarified timing data operations: proper estimation (instead of known points);
Fabian Huch <huch@in.tum.de>
parents: 79027
diff changeset
   622
        resources.try_allocate_tasks(rev_ordered_hosts, all_tasks)._1
78971
f930d24f1548 scheduled build: allocate cpus more aggressively, to avoid idle threads;
Fabian Huch <huch@in.tum.de>
parents: 78970
diff changeset
   623
      }
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   624
      else {
79101
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   625
        val critical_minimals = state.ready.filter(max_time(_) > threshold).map(_.name)
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   626
        val critical_nodes = path_max_times(critical_minimals).filter(_._2 > threshold).keySet
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   627
79101
4e47b34fbb8e clarified graph operations in timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79091
diff changeset
   628
        val (critical, other) = next_sorted.partition(task => critical_nodes.contains(task.name))
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   629
78971
f930d24f1548 scheduled build: allocate cpus more aggressively, to avoid idle threads;
Fabian Huch <huch@in.tum.de>
parents: 78970
diff changeset
   630
        val critical_tasks = critical.map(task => (task, best_threads(task), best_threads(task)))
f930d24f1548 scheduled build: allocate cpus more aggressively, to avoid idle threads;
Fabian Huch <huch@in.tum.de>
parents: 78970
diff changeset
   631
        val other_tasks = other.map(task => (task, 1, best_threads(task)))
f930d24f1548 scheduled build: allocate cpus more aggressively, to avoid idle threads;
Fabian Huch <huch@in.tum.de>
parents: 78970
diff changeset
   632
79021
1c91e884035d properly incorporate running tasks into timing heuristic;
Fabian Huch <huch@in.tum.de>
parents: 79020
diff changeset
   633
        val max_critical_parallel = parallel_paths(critical_minimals, critical_nodes.contains)
79028
6bada416ba55 clarified timing data operations: proper estimation (instead of known points);
Fabian Huch <huch@in.tum.de>
parents: 79027
diff changeset
   634
        val (critical_hosts, other_hosts) = rev_ordered_hosts.splitAt(max_critical_parallel)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   635
78971
f930d24f1548 scheduled build: allocate cpus more aggressively, to avoid idle threads;
Fabian Huch <huch@in.tum.de>
parents: 78970
diff changeset
   636
        val (configs1, resources1) = resources.try_allocate_tasks(critical_hosts, critical_tasks)
f930d24f1548 scheduled build: allocate cpus more aggressively, to avoid idle threads;
Fabian Huch <huch@in.tum.de>
parents: 78970
diff changeset
   637
        val (configs2, _) = resources1.try_allocate_tasks(other_hosts, other_tasks)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   638
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   639
        configs1 ::: configs2
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   640
      }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   641
    }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   642
  }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   643
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   644
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   645
  /* process for scheduled build */
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   646
78928
6c2c60b852e0 move timing data into scheduler for more efficient heuristics (e.g., with pre-calculated values);
Fabian Huch <huch@in.tum.de>
parents: 78888
diff changeset
   647
  abstract class Scheduled_Build_Process(
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   648
    build_context: Build.Context,
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   649
    build_progress: Progress,
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   650
    server: SSH.Server,
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   651
  ) extends Build_Process(build_context, build_progress, server) {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   652
    protected val start_date = Date.now()
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   653
78928
6c2c60b852e0 move timing data into scheduler for more efficient heuristics (e.g., with pre-calculated values);
Fabian Huch <huch@in.tum.de>
parents: 78888
diff changeset
   654
    def init_scheduler(timing_data: Timing_Data): Scheduler
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   655
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   656
    /* global resources with common close() operation */
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   657
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   658
    private final lazy val _log_store: Build_Log.Store = Build_Log.store(build_options)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   659
    private final lazy val _log_database: SQL.Database =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   660
      try {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   661
        val db = _log_store.open_database(server = this.server)
78851
db37cae970a6 more robust init_database();
wenzelm
parents: 78849
diff changeset
   662
        _log_store.init_database(db)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   663
        db
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   664
      }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   665
      catch { case exn: Throwable => close(); throw exn }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   666
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   667
    override def close(): Unit = {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   668
      super.close()
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   669
      Option(_log_database).foreach(_.close())
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   670
    }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   671
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   672
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   673
    /* previous results via build log */
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   674
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   675
    override def open_build_cluster(): Build_Cluster = {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   676
      val build_cluster = super.open_build_cluster()
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   677
      build_cluster.init()
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   678
      if (build_context.master && build_context.max_jobs > 0) {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   679
        val benchmark_options = build_options.string("build_hostname") = hostname
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   680
        Benchmark.benchmark(benchmark_options, progress)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   681
      }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   682
      build_cluster.benchmark()
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   683
      build_cluster
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   684
    }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   685
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   686
    private val timing_data: Timing_Data = {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   687
      val cluster_hosts: List[Build_Cluster.Host] =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   688
        if (build_context.max_jobs == 0) build_context.build_hosts
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   689
        else {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   690
          val local_build_host =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   691
            Build_Cluster.Host(
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   692
              hostname, jobs = build_context.max_jobs, numa = build_context.numa_shuffling)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   693
          local_build_host :: build_context.build_hosts
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   694
        }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   695
79090
20be5b925720 clarified load vs. apply vs. make;
Fabian Huch <huch@in.tum.de>
parents: 79089
diff changeset
   696
      val host_infos = Host_Infos.load(cluster_hosts, _host_database)
20be5b925720 clarified load vs. apply vs. make;
Fabian Huch <huch@in.tum.de>
parents: 79089
diff changeset
   697
      Timing_Data.load(host_infos, _log_database)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   698
    }
78928
6c2c60b852e0 move timing data into scheduler for more efficient heuristics (e.g., with pre-calculated values);
Fabian Huch <huch@in.tum.de>
parents: 78888
diff changeset
   699
    private val scheduler = init_scheduler(timing_data)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   700
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   701
    def write_build_log(results: Build.Results, state: Build_Process.State.Results): Unit = {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   702
      val sessions =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   703
        for {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   704
          (session_name, result) <- state.toList
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   705
          if !result.current
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   706
        } yield {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   707
          val info = build_context.sessions_structure(session_name)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   708
          val entry =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   709
            if (!results.cancelled(session_name)) {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   710
              val status =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   711
                if (result.ok) Build_Log.Session_Status.finished
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   712
                else Build_Log.Session_Status.failed
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   713
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   714
              Build_Log.Session_Entry(
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   715
                chapter = info.chapter,
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   716
                groups = info.groups,
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   717
                hostname = Some(result.node_info.hostname),
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   718
                threads = Some(timing_data.host_infos.num_threads(result.node_info)),
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   719
                timing = result.process_result.timing,
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   720
                sources = Some(result.output_shasum.digest.toString),
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   721
                status = Some(status))
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   722
            }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   723
            else
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   724
              Build_Log.Session_Entry(
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   725
                chapter = info.chapter,
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   726
                groups = info.groups,
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   727
                status = Some(Build_Log.Session_Status.cancelled))
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   728
          session_name -> entry
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   729
        }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   730
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   731
      val settings =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   732
        Build_Log.Settings.all_settings.map(_.name).map(name =>
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   733
          name -> Isabelle_System.getenv(name))
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   734
      val props =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   735
        List(
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   736
          Build_Log.Prop.build_id.name -> build_context.build_uuid,
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   737
          Build_Log.Prop.build_engine.name -> build_context.engine.name,
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   738
          Build_Log.Prop.build_host.name -> hostname,
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   739
          Build_Log.Prop.build_start.name -> Build_Log.print_date(start_date))
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   740
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   741
      val meta_info = Build_Log.Meta_Info(props, settings)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   742
      val build_info = Build_Log.Build_Info(sessions.toMap)
79089
Fabian Huch <huch@in.tum.de>
parents: 79088
diff changeset
   743
      val log_name = Build_Log.log_filename(engine = build_context.engine.name, date = start_date)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   744
79062
6977fb0153fb clarified modules: Build_Log.private_data provides raw data access without transaction_lock;
wenzelm
parents: 79042
diff changeset
   745
      Build_Log.private_data.update_sessions(
6977fb0153fb clarified modules: Build_Log.private_data provides raw data access without transaction_lock;
wenzelm
parents: 79042
diff changeset
   746
        _log_database, _log_store.cache.compress, log_name.file_name, build_info)
6977fb0153fb clarified modules: Build_Log.private_data provides raw data access without transaction_lock;
wenzelm
parents: 79042
diff changeset
   747
      Build_Log.private_data.update_meta_info(_log_database, log_name.file_name, meta_info)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   748
    }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   749
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   750
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   751
    /* build process */
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   752
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   753
    case class Cache(state: Build_Process.State, configs: List[Config], estimate: Date) {
78975
4a5d35b35aeb better invalidation for schedule cache (only on relevant changes);
Fabian Huch <huch@in.tum.de>
parents: 78974
diff changeset
   754
      def is_current(state: Build_Process.State): Boolean =
4a5d35b35aeb better invalidation for schedule cache (only on relevant changes);
Fabian Huch <huch@in.tum.de>
parents: 78974
diff changeset
   755
        this.state.pending.nonEmpty && this.state.results == state.results
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   756
      def is_current_estimate(estimate: Date): Boolean =
78975
4a5d35b35aeb better invalidation for schedule cache (only on relevant changes);
Fabian Huch <huch@in.tum.de>
parents: 78974
diff changeset
   757
        Math.abs((this.estimate.time - estimate.time).ms) < Time.minutes(1).ms
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   758
    }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   759
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   760
    private var cache = Cache(Build_Process.State(), Nil, Date.now())
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   761
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   762
    override def next_node_info(state: Build_Process.State, session_name: String): Node_Info = {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   763
      val configs =
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   764
        if (cache.is_current(state)) cache.configs
78928
6c2c60b852e0 move timing data into scheduler for more efficient heuristics (e.g., with pre-calculated values);
Fabian Huch <huch@in.tum.de>
parents: 78888
diff changeset
   765
        else scheduler.next(state)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   766
      configs.find(_.job_name == session_name).get.node_info
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   767
    }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   768
78969
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   769
    def is_current(state: Build_Process.State, session_name: String): Boolean =
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   770
      state.ancestor_results(session_name) match {
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   771
        case Some(ancestor_results) if ancestor_results.forall(_.current) =>
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   772
          val sources_shasum = state.sessions(session_name).sources_shasum
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   773
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   774
          val input_shasum =
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   775
            if (ancestor_results.isEmpty) ML_Process.bootstrap_shasum()
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   776
            else SHA1.flat_shasum(ancestor_results.map(_.output_shasum))
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   777
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   778
          val store_heap =
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   779
            build_context.build_heap || Sessions.is_pure(session_name) ||
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   780
              state.sessions.iterator.exists(_.ancestors.contains(session_name))
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   781
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   782
          store.check_output(
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   783
            _database_server, session_name,
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   784
            session_options = build_context.sessions_structure(session_name).options,
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   785
            sources_shasum = sources_shasum,
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   786
            input_shasum = input_shasum,
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   787
            fresh_build = build_context.fresh_build,
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   788
            store_heap = store_heap)._1
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   789
        case _ => false
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   790
    }
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   791
78970
5d38b72a1a66 finalize scheduled build only on master node;
Fabian Huch <huch@in.tum.de>
parents: 78969
diff changeset
   792
    override def next_jobs(state: Build_Process.State): List[String] = {
5d38b72a1a66 finalize scheduled build only on master node;
Fabian Huch <huch@in.tum.de>
parents: 78969
diff changeset
   793
      val finalize_limit = if (build_context.master) Int.MaxValue else 0
5d38b72a1a66 finalize scheduled build only on master node;
Fabian Huch <huch@in.tum.de>
parents: 78969
diff changeset
   794
79020
ef76705bf402 clarified ready vs. next ready;
Fabian Huch <huch@in.tum.de>
parents: 79019
diff changeset
   795
      if (progress.stopped) state.next_ready.map(_.name).take(finalize_limit)
78975
4a5d35b35aeb better invalidation for schedule cache (only on relevant changes);
Fabian Huch <huch@in.tum.de>
parents: 78974
diff changeset
   796
      else if (cache.is_current(state)) cache.configs.map(_.job_name).filterNot(state.is_running)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   797
      else {
79020
ef76705bf402 clarified ready vs. next ready;
Fabian Huch <huch@in.tum.de>
parents: 79019
diff changeset
   798
        val current = state.next_ready.filter(task => is_current(state, task.name))
78970
5d38b72a1a66 finalize scheduled build only on master node;
Fabian Huch <huch@in.tum.de>
parents: 78969
diff changeset
   799
        if (current.nonEmpty) current.map(_.name).take(finalize_limit)
78969
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   800
        else {
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   801
          val start = Time.now()
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   802
          val next = scheduler.next(state)
79105
6e92475ff925 clarified schedule message;
Fabian Huch <huch@in.tum.de>
parents: 79104
diff changeset
   803
          val schedule = scheduler.build_schedule(state)
78969
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   804
          val elapsed = Time.now() - start
78884
0233d5a5a4ca improved build messages;
Fabian Huch <huch@in.tum.de>
parents: 78851
diff changeset
   805
78976
8da0eedd562c tuned message;
Fabian Huch <huch@in.tum.de>
parents: 78975
diff changeset
   806
          val timing_msg = if (elapsed.is_relevant) " (took " + elapsed.message + ")" else ""
79105
6e92475ff925 clarified schedule message;
Fabian Huch <huch@in.tum.de>
parents: 79104
diff changeset
   807
          progress.echo_if(build_context.master && !cache.is_current_estimate(schedule.end),
6e92475ff925 clarified schedule message;
Fabian Huch <huch@in.tum.de>
parents: 79104
diff changeset
   808
            schedule.message + timing_msg)
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   809
78969
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   810
          val configs = next.filter(_.node_info.hostname == hostname)
79105
6e92475ff925 clarified schedule message;
Fabian Huch <huch@in.tum.de>
parents: 79104
diff changeset
   811
          cache = Cache(state, configs, schedule.end)
78969
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   812
          configs.map(_.job_name)
1b05c2b10c9f finalize current sessions before generating schedule;
Fabian Huch <huch@in.tum.de>
parents: 78968
diff changeset
   813
        }
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   814
      }
78970
5d38b72a1a66 finalize scheduled build only on master node;
Fabian Huch <huch@in.tum.de>
parents: 78969
diff changeset
   815
    }
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   816
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   817
    override def run(): Build.Results = {
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   818
      val results = super.run()
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   819
      if (build_context.master) write_build_log(results, snapshot().results)
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   820
      results
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   821
    }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   822
  }
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   823
79089
Fabian Huch <huch@in.tum.de>
parents: 79088
diff changeset
   824
  class Engine extends Build.Engine("build_schedule") {
Fabian Huch <huch@in.tum.de>
parents: 79088
diff changeset
   825
79108
Fabian Huch <huch@in.tum.de>
parents: 79107
diff changeset
   826
    def scheduler(timing_data: Timing_Data, context: Build.Context): Scheduler = {
Fabian Huch <huch@in.tum.de>
parents: 79107
diff changeset
   827
      val sessions_structure = context.sessions_structure
79089
Fabian Huch <huch@in.tum.de>
parents: 79088
diff changeset
   828
      val heuristics =
79108
Fabian Huch <huch@in.tum.de>
parents: 79107
diff changeset
   829
        List(5, 10, 20).map(Time.minutes(_)).map(
Fabian Huch <huch@in.tum.de>
parents: 79107
diff changeset
   830
          Timing_Heuristic(_, timing_data, sessions_structure))
79089
Fabian Huch <huch@in.tum.de>
parents: 79088
diff changeset
   831
      new Meta_Heuristic(heuristics)
Fabian Huch <huch@in.tum.de>
parents: 79088
diff changeset
   832
    }
Fabian Huch <huch@in.tum.de>
parents: 79088
diff changeset
   833
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   834
    override def open_build_process(
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   835
      context: Build.Context,
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   836
      progress: Progress,
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   837
      server: SSH.Server
78928
6c2c60b852e0 move timing data into scheduler for more efficient heuristics (e.g., with pre-calculated values);
Fabian Huch <huch@in.tum.de>
parents: 78888
diff changeset
   838
    ): Build_Process =
6c2c60b852e0 move timing data into scheduler for more efficient heuristics (e.g., with pre-calculated values);
Fabian Huch <huch@in.tum.de>
parents: 78888
diff changeset
   839
      new Scheduled_Build_Process(context, progress, server) {
79108
Fabian Huch <huch@in.tum.de>
parents: 79107
diff changeset
   840
        def init_scheduler(timing_data: Timing_Data): Scheduler = scheduler(timing_data, context)
78928
6c2c60b852e0 move timing data into scheduler for more efficient heuristics (e.g., with pre-calculated values);
Fabian Huch <huch@in.tum.de>
parents: 78888
diff changeset
   841
      }
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   842
  }
79091
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   843
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   844
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   845
  /* build schedule */
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   846
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   847
  def build_schedule(
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   848
    options: Options,
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   849
    build_hosts: List[Build_Cluster.Host] = Nil,
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   850
    selection: Sessions.Selection = Sessions.Selection.empty,
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   851
    progress: Progress = new Progress,
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   852
    afp_root: Option[Path] = None,
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   853
    dirs: List[Path] = Nil,
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   854
    select_dirs: List[Path] = Nil,
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   855
    infos: List[Sessions.Info] = Nil,
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   856
    numa_shuffling: Boolean = false,
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   857
    augment_options: String => List[Options.Spec] = _ => Nil,
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   858
    session_setup: (String, Session) => Unit = (_, _) => (),
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   859
    cache: Term.Cache = Term.Cache.make()
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   860
  ): Schedule = {
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   861
    val build_engine = new Engine
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   862
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   863
    val store = build_engine.build_store(options, build_hosts = build_hosts, cache = cache)
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   864
    val log_store = Build_Log.store(options, cache = cache)
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   865
    val build_options = store.options
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   866
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   867
    def build_schedule(
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   868
      server: SSH.Server,
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   869
      database_server: Option[SQL.Database],
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   870
      log_database: PostgreSQL.Database,
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   871
      host_database: SQL.Database
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   872
    ): Schedule = {
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   873
      val full_sessions =
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   874
        Sessions.load_structure(build_options, dirs = AFP.make_dirs(afp_root) ::: dirs,
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   875
          select_dirs = select_dirs, infos = infos, augment_options = augment_options)
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   876
      val full_sessions_selection = full_sessions.imports_selection(selection)
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   877
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   878
      val build_deps =
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   879
        Sessions.deps(full_sessions.selection(selection), progress = progress,
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   880
          inlined_files = true).check_errors
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   881
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   882
      val build_context =
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   883
        Build.Context(store, build_engine, build_deps, afp_root = afp_root,
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   884
          build_hosts = build_hosts, hostname = Build.hostname(build_options),
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   885
          numa_shuffling = numa_shuffling, max_jobs = 0, session_setup = session_setup,
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   886
          master = true)
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   887
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   888
      val cluster_hosts = build_context.build_hosts
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   889
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   890
      val hosts_current =
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   891
        cluster_hosts.forall(host => isabelle.Host.read_info(host_database, host.name).isDefined)
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   892
      if (!hosts_current) {
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   893
        val build_cluster = Build_Cluster.make(build_context, progress = progress)
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   894
        build_cluster.open()
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   895
        build_cluster.init()
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   896
        build_cluster.benchmark()
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   897
        build_cluster.close()
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   898
      }
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   899
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   900
      val host_infos = Host_Infos.load(cluster_hosts, host_database)
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   901
      val timing_data = Timing_Data.load(host_infos, log_database)
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   902
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   903
      val sessions = Build_Process.Sessions.empty.init(build_context, database_server, progress)
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   904
      def task(session: Build_Job.Session_Context): Build_Process.Task =
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   905
        Build_Process.Task(session.name, session.deps, JSON.Object.empty, build_context.build_uuid)
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   906
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   907
      val build_state =
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   908
        Build_Process.State(sessions = sessions, pending = sessions.iterator.map(task).toList)
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   909
79108
Fabian Huch <huch@in.tum.de>
parents: 79107
diff changeset
   910
      val scheduler = build_engine.scheduler(timing_data, build_context)
79105
6e92475ff925 clarified schedule message;
Fabian Huch <huch@in.tum.de>
parents: 79104
diff changeset
   911
      def schedule_msg(res: Exn.Result[Schedule]): String =
6e92475ff925 clarified schedule message;
Fabian Huch <huch@in.tum.de>
parents: 79104
diff changeset
   912
        res match { case Exn.Res(schedule) => schedule.message case _ => "" }
6e92475ff925 clarified schedule message;
Fabian Huch <huch@in.tum.de>
parents: 79104
diff changeset
   913
6e92475ff925 clarified schedule message;
Fabian Huch <huch@in.tum.de>
parents: 79104
diff changeset
   914
      Timing.timeit(scheduler.build_schedule(build_state), schedule_msg, output = progress.echo(_))
79091
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   915
    }
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   916
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   917
    using(store.open_server()) { server =>
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   918
      using_optional(store.maybe_open_database_server(server = server)) { database_server =>
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   919
        using(log_store.open_database(server = server)) { log_database =>
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   920
          using(store.open_build_database(
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   921
            path = isabelle.Host.private_data.database, server = server)) { host_database =>
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   922
              build_schedule(server, database_server, log_database, host_database)
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   923
          }
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   924
        }
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   925
      }
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   926
    }
06f380099b2e added method to generate build schedules directly;
Fabian Huch <huch@in.tum.de>
parents: 79090
diff changeset
   927
  }
78845
ff96d94957cb add module for faster scheduled builds;
Fabian Huch <huch@in.tum.de>
parents:
diff changeset
   928
}