| author | desharna | 
| Mon, 23 May 2022 10:23:33 +0200 | |
| changeset 75460 | 7c2fe41f5ee8 | 
| parent 75393 | 87ebf5a50283 | 
| child 75958 | 97445e208419 | 
| permissions | -rw-r--r-- | 
/*  Title:      Pure/General/pretty.scala
    Author:     Makarius

Generic pretty printing module.
*/
| 6 | ||
| 7 | package isabelle | |
| 8 | ||
| 71601 | 9 | import scala.annotation.tailrec | 
| 10 | ||
| 36683 | 11 | |
object Pretty {
  /* XML constructors */

  /** Body consisting of one text node that holds `Symbol.space`. */
  val space: XML.Body = List(XML.Text(Symbol.space))

  /**
   * Body of `n` spaces: empty for 0, the shared `space` value for 1, otherwise
   * a single text node built from `Symbol.spaces(n)`.
   *
   * NOTE(review): negative `n` is passed to `Symbol.spaces` unchanged; how that
   * is treated is not visible in this file.
   */
  def spaces(n: Int): XML.Body =
    if (n == 0) Nil
    else if (n == 1) space
    else List(XML.Text(Symbol.spaces(n)))

  /** Element with `Markup.Block(consistent, indent)` around `body`. */
  def block(consistent: Boolean, indent: Int, body: XML.Body): XML.Tree =
    XML.Elem(Markup.Block(consistent, indent), body)

  /** Block with `consistent = false`. */
  def block(indent: Int, body: XML.Body): XML.Tree = block(false, indent, body)

  /** Block with `consistent = false` and indentation 2. */
  def block(body: XML.Body): XML.Tree = block(2, body)

  /** Element with `Markup.Break(width, indent)` whose body is `spaces(width)`. */
  def brk(width: Int, indent: Int = 0): XML.Tree =
    XML.Elem(Markup.Break(width, indent), spaces(width))

  /** Forced break, represented by `XML.newline`. */
  val fbrk: XML.Tree = XML.newline

  /** Puts `fbrk` between the given trees. */
  def fbreaks(ts: List[XML.Tree]): XML.Body = Library.separate(fbrk, ts)

  /** Separator: an element marked `Markup.SEPARATOR` containing `space`, followed by `fbrk`. */
  val Separator: XML.Body = List(XML.elem(Markup.SEPARATOR, space), fbrk)

  /** Puts `Separator` between the given trees and flattens the result into one body. */
  def separate(ts: List[XML.Tree]): XML.Body =
    Library.separate(Separator, ts.map(List(_))).flatten


  /* text metric -- standardized to width of space */

  /** Measures strings; `unit` is the reference unit and `apply` the width of a string. */
  abstract class Metric {
    val unit: Double
    def apply(s: String): Double
  }

  /** Metric with unit 1.0 where the width of a string is `s.length`. */
  object Default_Metric extends Metric {
    val unit = 1.0
    def apply(s: String): Double = s.length.toDouble
  }


  /* markup trees with physical blocks and breaks */

  /** Replaces negative values by 0. */
  private def force_nat(i: Int): Int = i max 0

  /** Internal tree used for formatting; every node knows its `length`. */
  private sealed abstract class Tree { def length: Double }

  /** Block with optional markup (and optional wrapped body); `length` is precomputed by `make_block`. */
  private case class Block(
    markup: Option[(Markup, Option[XML.Body])],
    consistent: Boolean, indent: Int, body: List[Tree], length: Double) extends Tree

  /** Break; its length is its `width`. */
  private case class Break(force: Boolean, width: Int, indent: Int) extends Tree {
    def length: Double = width.toDouble
  }

  /** Plain string together with its measured length. */
  private case class Str(string: String, length: Double) extends Tree

  /** Forced break of width 1 and indent 0, used between the lines of a text node. */
  private val FBreak = Break(true, 1, 0)

  /**
   * Builds a `Block` with non-negative indentation and precomputed length.
   *
   * The length is the maximum over the segments delimited by forced breaks in
   * `body`; each segment after a forced break starts with an unforced break of
   * width `indent1 + ind`, where `ind` is the indent of that forced break.
   */
  private def make_block(
    markup: Option[(Markup, Option[XML.Body])],
    consistent: Boolean,
    indent: Int,
    body: List[Tree]
  ): Tree = {
    val indent1 = force_nat(indent)

    @tailrec def body_length(prts: List[Tree], len: Double): Double = {
      // split at the first forced break
      val (line, rest) =
        Library.take_prefix[Tree]({ case Break(true, _, _) => false case _ => true }, prts)
      val len1 = (line.foldLeft(0.0) { case (l, t) => l + t.length }) max len
      // rest is either empty or starts with the forced break found above
      (rest: @unchecked) match {
        case Break(true, _, ind) :: rest1 =>
          body_length(Break(false, indent1 + ind, 0) :: rest1, len1)
        case Nil => len1
      }
    }
    Block(markup, consistent, indent1, body, body_length(body, 0.0))
  }


  /* formatted output */

  /**
   * Output state: `tx` is the output so far in reverse order, `pos` the current
   * position within the line, `nl` the number of newlines emitted.
   */
  private sealed case class Text(tx: XML.Body = Nil, pos: Double = 0.0, nl: Int = 0) {
    def newline: Text = copy(tx = fbrk :: tx, pos = 0.0, nl = nl + 1)
    def string(s: String, len: Double): Text =
      copy(tx = if (s == "") tx else XML.Text(s) :: tx, pos = pos + len)
    def blanks(wd: Int): Text = string(Symbol.spaces(wd), wd.toDouble)
    def content: XML.Body = tx.reverse
  }

  /**
   * Total length of the trees up to the next break. If the list ends without a
   * break, `after` is added for the material that follows it.
   *
   * Uses `span` and `foldRight` instead of non-tail recursion, so that long
   * runs of trees without a break do not grow the call stack. The right fold
   * keeps the summation order `t1 + (t2 + (... + end))`.
   */
  private def break_dist(trees: List[Tree], after: Double): Double = {
    val (prefix, rest) =
      trees.span {
        case _: Break => false
        case _ => true
      }
    val end = if (rest.isEmpty) after else 0.0
    prefix.foldRight(end)((t, dist) => t.length + dist)
  }

  /** Turns an unforced break into a forced one; other trees are unchanged. */
  private def force_break(tree: Tree): Tree =
    tree match { case Break(false, wd, ind) => Break(true, wd, ind) case _ => tree }

  /** Applies `force_break` to every tree of the list (not to nested bodies). */
  private def force_all(trees: List[Tree]): List[Tree] = trees.map(force_break)

  /**
   * Applies `force_break` to the first break of the list, if any.
   *
   * Uses `span` instead of non-tail recursion, so that long runs of trees
   * without a break do not grow the call stack.
   */
  private def force_next(trees: List[Tree]): List[Tree] = {
    val (prefix, rest) =
      trees.span {
        case _: Break => false
        case _ => true
      }
    rest match {
      case b :: ts => prefix ::: force_break(b) :: ts
      case Nil => trees
    }
  }

  val default_margin: Double = 76.0
  val default_breakgain: Double = default_margin / 20

  /**
   * Formats `input` by resolving its block and break markup into physical
   * newlines and spaces.
   *
   * @param input body with `Markup.Block` / `Markup.Break` / `Markup.ITEM`
   *   elements; other elements are kept and treated as blocks of indentation 0
   * @param margin line width that unforced breaks try to respect
   * @param breakgain minimal progress beyond the block indentation before a
   *   break is taken
   * @param metric measures the width of text
   * @return the formatted body
   *
   * A margin for which `margin / 2` rounds to 0 (e.g. `margin = 0`) is
   * accepted: blocks are then formatted with indentation 0 instead of failing
   * with a division by zero.
   */
  def formatted(input: XML.Body,
    margin: Double = default_margin,
    breakgain: Double = default_breakgain,
    metric: Metric = Default_Metric
  ): XML.Body = {
    val emergencypos = (margin / 2).round.toInt

    // translate XML into the internal tree representation
    def make_tree(inp: XML.Body): List[Tree] =
      inp flatMap {
        case XML.Wrapped_Elem(markup, body1, body2) =>
          List(make_block(Some((markup, Some(body1))), false, 0, make_tree(body2)))
        case XML.Elem(markup, body) =>
          markup match {
            case Markup.Block(consistent, indent) =>
              List(make_block(None, consistent, indent, make_tree(body)))
            case Markup.Break(width, indent) =>
              List(Break(false, force_nat(width), force_nat(indent)))
            case Markup(Markup.ITEM, _) =>
              // item: block of indentation 2 that starts with a bullet element and a space
              List(make_block(None, false, 2,
                make_tree(XML.elem(Markup.BULLET, space) :: space ::: body)))
            case _ =>
              List(make_block(Some((markup, None)), false, 0, make_tree(body)))
          }
        case XML.Text(text) =>
          // line breaks inside text become forced breaks
          Library.separate(FBreak, split_lines(text).map(s => Str(s, metric(s))))
      }

    // blockin: indentation of the enclosing block;
    // after: length of the material that follows the enclosing block up to its next break
    def format(trees: List[Tree], blockin: Int, after: Double, text: Text): Text =
      trees match {
        case Nil => text

        case Block(markup, consistent, indent, body, blen) :: ts =>
          val pos1 = (text.pos + indent).ceil.toInt
          // Indentation beyond emergencypos wraps around. Int remainder by zero
          // throws ArithmeticException, so emergencypos == 0 is treated separately.
          val blockin1 =
            if (pos1 < emergencypos) pos1
            else if (emergencypos == 0) 0
            else pos1 % emergencypos
          val d = break_dist(ts, after)
          // a consistent block that does not fit on the line gets all its breaks forced
          val body1 = if (consistent && text.pos + blen > margin - d) force_all(body) else body
          val btext =
            markup match {
              case None => format(body1, blockin1, d, text)
              case Some((m, markup_body)) =>
                // format the body into a fresh buffer, then wrap it into its element
                val btext0 = format(body1, blockin1, d, text.copy(tx = Nil))
                val elem =
                  markup_body match {
                    case None => XML.Elem(m, btext0.content)
                    case Some(b) => XML.Wrapped_Elem(m, b, btext0.content)
                  }
                btext0.copy(tx = elem :: text.tx)
            }
          // if the block produced a newline, the next break is forced as well
          val ts1 = if (text.nl < btext.nl) force_next(ts) else ts
          format(ts1, blockin, after, btext)

        case Break(force, wd, ind) :: ts =>
          if (!force &&
              text.pos + wd <= ((margin - break_dist(ts, after)) max (blockin + breakgain)))
            format(ts, blockin, after, text.blanks(wd))
          else format(ts, blockin, after, text.newline.blanks(blockin + ind))

        case Str(s, len) :: ts => format(ts, blockin, after, text.string(s, len))
      }
    format(make_tree(input), 0, 0.0, Text()).content
  }

  /** Formats `input` like `formatted` and returns `XML.content` of the result. */
  def string_of(input: XML.Body,
    margin: Double = default_margin,
    breakgain: Double = default_breakgain,
    metric: Metric = Default_Metric): String =
    XML.content(formatted(input, margin = margin, breakgain = breakgain, metric = metric))
}