author | wenzelm |
Wed, 03 Mar 2021 22:31:11 +0100 | |
changeset 73357 | 31d4274f32de |
parent 73355 | ec52a1a6ed31 |
child 73362 | dde25151c3c1 |
permissions | -rw-r--r-- |
34136 | 1 |
/* Title: Pure/library.scala |
2 |
Author: Makarius |
|
3 |
||
4 |
Basic library. |
|
5 |
*/ |
|
6 |
||
7 |
package isabelle |
|
8 |
||
38258 | 9 |
|
63781 | 10 |
import scala.annotation.tailrec |
51981
a8ffd3692f57
more scalable Library.separate -- NB: JVM has tiny fixed-size stack;
wenzelm
parents:
51616
diff
changeset
|
11 |
import scala.collection.mutable |
59224 | 12 |
import scala.util.matching.Regex |
51981
a8ffd3692f57
more scalable Library.separate -- NB: JVM has tiny fixed-size stack;
wenzelm
parents:
51616
diff
changeset
|
13 |
|
37018 | 14 |
|
34136 | 15 |
object Library |
16 |
{ |
|
63789 | 17 |
/* resource management */ |
18 |
||
69393
ed0824ef337e
static type for Library.using: avoid Java 11 warnings on "Illegal reflective access";
wenzelm
parents:
68715
diff
changeset
|
19 |
def using[A <: AutoCloseable, B](a: A)(f: A => B): B = |
63789 | 20 |
{ |
69393
ed0824ef337e
static type for Library.using: avoid Java 11 warnings on "Illegal reflective access";
wenzelm
parents:
68715
diff
changeset
|
21 |
try { f(a) } |
ed0824ef337e
static type for Library.using: avoid Java 11 warnings on "Illegal reflective access";
wenzelm
parents:
68715
diff
changeset
|
22 |
finally { if (a != null) a.close() } |
63789 | 23 |
} |
24 |
||
25 |
||
57909
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
26 |
/* integers */ |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
27 |
|
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
28 |
private val small_int = 10000 |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
29 |
private lazy val small_int_table = |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
30 |
{ |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
31 |
val array = new Array[String](small_int) |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
32 |
for (i <- 0 until small_int) array(i) = i.toString |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
33 |
array |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
34 |
} |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
35 |
|
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
36 |
def is_small_int(s: String): Boolean = |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
37 |
{ |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
38 |
val len = s.length |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
39 |
1 <= len && len <= 4 && |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
40 |
s.forall(c => '0' <= c && c <= '9') && |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
41 |
(len == 1 || s(0) != '0') |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
42 |
} |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
43 |
|
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
44 |
def signed_string_of_long(i: Long): String = |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
45 |
if (0 <= i && i < small_int) small_int_table(i.toInt) |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
46 |
else i.toString |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
47 |
|
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
48 |
def signed_string_of_int(i: Int): String = |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
49 |
if (0 <= i && i < small_int) small_int_table(i) |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
50 |
else i.toString |
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
51 |
|
0fb331032f02
more compact representation of special string values;
wenzelm
parents:
57831
diff
changeset
|
52 |
|
48996 | 53 |
/* separated chunks */ |
36688 | 54 |
|
55 |
def separate[A](s: A, list: List[A]): List[A] = |
|
51981
a8ffd3692f57
more scalable Library.separate -- NB: JVM has tiny fixed-size stack;
wenzelm
parents:
51616
diff
changeset
|
56 |
{ |
a8ffd3692f57
more scalable Library.separate -- NB: JVM has tiny fixed-size stack;
wenzelm
parents:
51616
diff
changeset
|
57 |
val result = new mutable.ListBuffer[A] |
a8ffd3692f57
more scalable Library.separate -- NB: JVM has tiny fixed-size stack;
wenzelm
parents:
51616
diff
changeset
|
58 |
var first = true |
a8ffd3692f57
more scalable Library.separate -- NB: JVM has tiny fixed-size stack;
wenzelm
parents:
51616
diff
changeset
|
59 |
for (x <- list) { |
a8ffd3692f57
more scalable Library.separate -- NB: JVM has tiny fixed-size stack;
wenzelm
parents:
51616
diff
changeset
|
60 |
if (first) { |
a8ffd3692f57
more scalable Library.separate -- NB: JVM has tiny fixed-size stack;
wenzelm
parents:
51616
diff
changeset
|
61 |
first = false |
a8ffd3692f57
more scalable Library.separate -- NB: JVM has tiny fixed-size stack;
wenzelm
parents:
51616
diff
changeset
|
62 |
result += x |
a8ffd3692f57
more scalable Library.separate -- NB: JVM has tiny fixed-size stack;
wenzelm
parents:
51616
diff
changeset
|
63 |
} |
a8ffd3692f57
more scalable Library.separate -- NB: JVM has tiny fixed-size stack;
wenzelm
parents:
51616
diff
changeset
|
64 |
else { |
a8ffd3692f57
more scalable Library.separate -- NB: JVM has tiny fixed-size stack;
wenzelm
parents:
51616
diff
changeset
|
65 |
result += s |
a8ffd3692f57
more scalable Library.separate -- NB: JVM has tiny fixed-size stack;
wenzelm
parents:
51616
diff
changeset
|
66 |
result += x |
a8ffd3692f57
more scalable Library.separate -- NB: JVM has tiny fixed-size stack;
wenzelm
parents:
51616
diff
changeset
|
67 |
} |
36688 | 68 |
} |
51981
a8ffd3692f57
more scalable Library.separate -- NB: JVM has tiny fixed-size stack;
wenzelm
parents:
51616
diff
changeset
|
69 |
result.toList |
a8ffd3692f57
more scalable Library.separate -- NB: JVM has tiny fixed-size stack;
wenzelm
parents:
51616
diff
changeset
|
70 |
} |
36688 | 71 |
|
56600 | 72 |
def separated_chunks(sep: Char => Boolean, source: CharSequence): Iterator[CharSequence] = |
48996 | 73 |
new Iterator[CharSequence] { |
74 |
private val end = source.length |
|
75 |
private def next_chunk(i: Int): Option[(CharSequence, Int)] = |
|
76 |
{ |
|
77 |
if (i < end) { |
|
56600 | 78 |
var j = i; do j += 1 while (j < end && !sep(source.charAt(j))) |
48996 | 79 |
Some((source.subSequence(i + 1, j), j)) |
80 |
} |
|
81 |
else None |
|
43598 | 82 |
} |
48996 | 83 |
private var state: Option[(CharSequence, Int)] = if (end == 0) None else next_chunk(-1) |
84 |
||
73337 | 85 |
def hasNext: Boolean = state.isDefined |
48996 | 86 |
def next(): CharSequence = |
87 |
state match { |
|
60215 | 88 |
case Some((s, i)) => state = next_chunk(i); s |
48996 | 89 |
case None => Iterator.empty.next() |
90 |
} |
|
43598 | 91 |
} |
92 |
||
48996 | 93 |
def space_explode(sep: Char, str: String): List[String] = |
56600 | 94 |
separated_chunks(_ == sep, str).map(_.toString).toList |
48996 | 95 |
|
96 |
||
97 |
/* lines */ |
|
98 |
||
73357 | 99 |
def terminate_lines(lines: IterableOnce[String]): String = lines.mkString("", "\n", "\n") |
51983
32692ce4c61a
more frugal line termination, to cope with huge log files (see also 016cb7d8f297);
wenzelm
parents:
51981
diff
changeset
|
100 |
|
73357 | 101 |
def cat_lines(lines: IterableOnce[String]): String = lines.mkString("\n") |
48996 | 102 |
|
43670
7f933761764b
prefer space_explode/split_lines as in Isabelle/ML;
wenzelm
parents:
43652
diff
changeset
|
103 |
def split_lines(str: String): List[String] = space_explode('\n', str) |
7f933761764b
prefer space_explode/split_lines as in Isabelle/ML;
wenzelm
parents:
43652
diff
changeset
|
104 |
|
62590 | 105 |
def prefix_lines(prfx: String, str: String): String = |
71164 | 106 |
if (str == "") str else cat_lines(split_lines(str).map(prfx + _)) |
62590 | 107 |
|
48996 | 108 |
def first_line(source: CharSequence): String = |
109 |
{ |
|
56600 | 110 |
val lines = separated_chunks(_ == '\n', source) |
73344 | 111 |
if (lines.hasNext) lines.next().toString |
48996 | 112 |
else "" |
113 |
} |
|
114 |
||
73332 | 115 |
def trim_line(s: String): String = |
116 |
if (s.endsWith("\r\n")) s.substring(0, s.length - 2) |
|
117 |
else if (s.endsWith("\r") || s.endsWith("\n")) s.substring(0, s.length - 1) |
|
118 |
else s |
|
119 |
||
120 |
def trim_split_lines(s: String): List[String] = |
|
121 |
split_lines(trim_line(s)).map(trim_line) |
|
122 |
||
65932 | 123 |
def encode_lines(s: String): String = s.replace('\n', '\u000b') |
124 |
def decode_lines(s: String): String = s.replace('\u000b', '\n') |
|
125 |
||
50847 | 126 |
|
127 |
/* strings */ |
|
128 |
||
73357 | 129 |
def cat_strings0(strs: IterableOnce[String]): String = strs.mkString("\u0000") |
73333 | 130 |
def split_strings0(str: String): List[String] = space_explode('\u0000', str) |
131 |
||
64355 | 132 |
def make_string(f: StringBuilder => Unit): String = |
133 |
{ |
|
134 |
val s = new StringBuilder |
|
135 |
f(s) |
|
136 |
s.toString |
|
137 |
} |
|
138 |
||
50847 | 139 |
def try_unprefix(prfx: String, s: String): Option[String] = |
140 |
if (s.startsWith(prfx)) Some(s.substring(prfx.length)) else None |
|
141 |
||
55033 | 142 |
def try_unsuffix(sffx: String, s: String): Option[String] = |
143 |
if (s.endsWith(sffx)) Some(s.substring(0, s.length - sffx.length)) else None |
|
144 |
||
65606 | 145 |
def perhaps_unprefix(prfx: String, s: String): String = try_unprefix(prfx, s) getOrElse s |
146 |
def perhaps_unsuffix(sffx: String, s: String): String = try_unsuffix(sffx, s) getOrElse s |
|
147 |
||
65903 | 148 |
def isolate_substring(s: String): String = new String(s.toCharArray) |
64820
00488a8c042f
Line.Document consists of independently allocated strings;
wenzelm
parents:
64370
diff
changeset
|
149 |
|
71864 | 150 |
def strip_ansi_color(s: String): String = |
73355 | 151 |
s.replaceAll("\u001b\\[\\d+m", "") |
71864 | 152 |
|
43598 | 153 |
|
48996 | 154 |
/* quote */ |
46196 | 155 |
|
67820
e30d6368c7c8
clarified argument formats: explicit Unit, allow XML.Elem as well;
wenzelm
parents:
67436
diff
changeset
|
156 |
def single_quote(s: String): String = "'" + s + "'" |
e30d6368c7c8
clarified argument formats: explicit Unit, allow XML.Elem as well;
wenzelm
parents:
67436
diff
changeset
|
157 |
|
43598 | 158 |
def quote(s: String): String = "\"" + s + "\"" |
56843
b2bfcd8cda80
support for path completion based on file-system content;
wenzelm
parents:
56730
diff
changeset
|
159 |
|
b2bfcd8cda80
support for path completion based on file-system content;
wenzelm
parents:
56730
diff
changeset
|
160 |
def try_unquote(s: String): Option[String] = |
b2bfcd8cda80
support for path completion based on file-system content;
wenzelm
parents:
56730
diff
changeset
|
161 |
if (s.startsWith("\"") && s.endsWith("\"")) Some(s.substring(1, s.length - 1)) |
b2bfcd8cda80
support for path completion based on file-system content;
wenzelm
parents:
56730
diff
changeset
|
162 |
else None |
b2bfcd8cda80
support for path completion based on file-system content;
wenzelm
parents:
56730
diff
changeset
|
163 |
|
58592 | 164 |
def perhaps_unquote(s: String): String = try_unquote(s) getOrElse s |
165 |
||
43598 | 166 |
def commas(ss: Iterable[String]): String = ss.iterator.mkString(", ") |
48362 | 167 |
def commas_quote(ss: Iterable[String]): String = ss.iterator.map(quote).mkString(", ") |
43598 | 168 |
|
36688 | 169 |
|
51983
32692ce4c61a
more frugal line termination, to cope with huge log files (see also 016cb7d8f297);
wenzelm
parents:
51981
diff
changeset
|
170 |
/* CharSequence */ |
34141 | 171 |
|
172 |
class Reverse(text: CharSequence, start: Int, end: Int) extends CharSequence |
|
173 |
{ |
|
73120
c3589f2dff31
more informative errors: simplify diagnosis of spurious failures reported by users;
wenzelm
parents:
72214
diff
changeset
|
174 |
require(0 <= start && start <= end && end <= text.length, "bad reverse range") |
34141 | 175 |
|
176 |
def this(text: CharSequence) = this(text, 0, text.length) |
|
177 |
||
178 |
def length: Int = end - start |
|
179 |
def charAt(i: Int): Char = text.charAt(end - i - 1) |
|
180 |
||
181 |
def subSequence(i: Int, j: Int): CharSequence = |
|
182 |
if (0 <= i && i <= j && j <= length) new Reverse(text, end - j, end - i) |
|
183 |
else throw new IndexOutOfBoundsException |
|
184 |
||
185 |
override def toString: String = |
|
186 |
{ |
|
187 |
val buf = new StringBuilder(length) |
|
188 |
for (i <- 0 until length) |
|
189 |
buf.append(charAt(i)) |
|
190 |
buf.toString |
|
191 |
} |
|
192 |
} |
|
193 |
||
51983
32692ce4c61a
more frugal line termination, to cope with huge log files (see also 016cb7d8f297);
wenzelm
parents:
51981
diff
changeset
|
194 |
class Line_Termination(text: CharSequence) extends CharSequence |
32692ce4c61a
more frugal line termination, to cope with huge log files (see also 016cb7d8f297);
wenzelm
parents:
51981
diff
changeset
|
195 |
{ |
32692ce4c61a
more frugal line termination, to cope with huge log files (see also 016cb7d8f297);
wenzelm
parents:
51981
diff
changeset
|
196 |
def length: Int = text.length + 1 |
32692ce4c61a
more frugal line termination, to cope with huge log files (see also 016cb7d8f297);
wenzelm
parents:
51981
diff
changeset
|
197 |
def charAt(i: Int): Char = if (i == text.length) '\n' else text.charAt(i) |
32692ce4c61a
more frugal line termination, to cope with huge log files (see also 016cb7d8f297);
wenzelm
parents:
51981
diff
changeset
|
198 |
def subSequence(i: Int, j: Int): CharSequence = |
32692ce4c61a
more frugal line termination, to cope with huge log files (see also 016cb7d8f297);
wenzelm
parents:
51981
diff
changeset
|
199 |
if (j == text.length + 1) new Line_Termination(text.subSequence(i, j - 1)) |
32692ce4c61a
more frugal line termination, to cope with huge log files (see also 016cb7d8f297);
wenzelm
parents:
51981
diff
changeset
|
200 |
else text.subSequence(i, j) |
32692ce4c61a
more frugal line termination, to cope with huge log files (see also 016cb7d8f297);
wenzelm
parents:
51981
diff
changeset
|
201 |
override def toString: String = text.toString + "\n" |
32692ce4c61a
more frugal line termination, to cope with huge log files (see also 016cb7d8f297);
wenzelm
parents:
51981
diff
changeset
|
202 |
} |
32692ce4c61a
more frugal line termination, to cope with huge log files (see also 016cb7d8f297);
wenzelm
parents:
51981
diff
changeset
|
203 |
|
34141 | 204 |
|
59224 | 205 |
/* regular expressions */ |
206 |
||
207 |
def make_regex(s: String): Option[Regex] = |
|
208 |
try { Some(new Regex(s)) } catch { case ERROR(_) => None } |
|
209 |
||
64871 | 210 |
def is_regex_meta(c: Char): Boolean = """()[]{}\^$|?*+.<>-=!""".contains(c) |
211 |
||
212 |
def escape_regex(s: String): String = |
|
71601 | 213 |
if (s.exists(is_regex_meta)) { |
64871 | 214 |
(for (c <- s.iterator) |
215 |
yield { if (is_regex_meta(c)) "\\" + c.toString else c.toString }).mkString |
|
216 |
} |
|
217 |
else s |
|
218 |
||
59224 | 219 |
|
61883
c0f34fe6aa61
clarified length of block with pre-existant forced breaks;
wenzelm
parents:
60215
diff
changeset
|
220 |
/* lists */ |
c0f34fe6aa61
clarified length of block with pre-existant forced breaks;
wenzelm
parents:
60215
diff
changeset
|
221 |
|
c0f34fe6aa61
clarified length of block with pre-existant forced breaks;
wenzelm
parents:
60215
diff
changeset
|
222 |
def take_prefix[A](pred: A => Boolean, xs: List[A]): (List[A], List[A]) = |
c0f34fe6aa61
clarified length of block with pre-existant forced breaks;
wenzelm
parents:
60215
diff
changeset
|
223 |
(xs.takeWhile(pred), xs.dropWhile(pred)) |
56686 | 224 |
|
67434 | 225 |
def take_suffix[A](pred: A => Boolean, xs: List[A]): (List[A], List[A]) = |
226 |
{ |
|
227 |
val rev_xs = xs.reverse |
|
228 |
(rev_xs.dropWhile(pred).reverse, rev_xs.takeWhile(pred).reverse) |
|
229 |
} |
|
230 |
||
231 |
def trim[A](pred: A => Boolean, xs: List[A]): List[A] = |
|
232 |
take_suffix(pred, take_prefix(pred, xs)._2)._1 |
|
233 |
||
60215 | 234 |
def member[A, B](xs: List[A])(x: B): Boolean = xs.contains(x) |
56688 | 235 |
def insert[A](x: A)(xs: List[A]): List[A] = if (xs.contains(x)) xs else x :: xs |
236 |
def remove[A, B](x: B)(xs: List[A]): List[A] = if (member(xs)(x)) xs.filterNot(_ == x) else xs |
|
237 |
def update[A](x: A)(xs: List[A]): List[A] = x :: remove(x)(xs) |
|
63734
133e3e84e6fb
some support for merge of Isabelle/jEdit shortcuts wrt. jEdit keymap;
wenzelm
parents:
62590
diff
changeset
|
238 |
|
63867 | 239 |
def merge[A](xs: List[A], ys: List[A]): List[A] = |
240 |
if (xs.eq(ys)) xs |
|
241 |
else if (xs.isEmpty) ys |
|
242 |
else ys.foldRight(xs)(Library.insert(_)(_)) |
|
243 |
||
64207 | 244 |
def distinct[A](xs: List[A], eq: (A, A) => Boolean = (x: A, y: A) => x == y): List[A] = |
63734
133e3e84e6fb
some support for merge of Isabelle/jEdit shortcuts wrt. jEdit keymap;
wenzelm
parents:
62590
diff
changeset
|
245 |
{ |
133e3e84e6fb
some support for merge of Isabelle/jEdit shortcuts wrt. jEdit keymap;
wenzelm
parents:
62590
diff
changeset
|
246 |
val result = new mutable.ListBuffer[A] |
64207 | 247 |
xs.foreach(x => if (!result.exists(y => eq(x, y))) result += x) |
63734
133e3e84e6fb
some support for merge of Isabelle/jEdit shortcuts wrt. jEdit keymap;
wenzelm
parents:
62590
diff
changeset
|
248 |
result.toList |
133e3e84e6fb
some support for merge of Isabelle/jEdit shortcuts wrt. jEdit keymap;
wenzelm
parents:
62590
diff
changeset
|
249 |
} |
63781 | 250 |
|
64207 | 251 |
def duplicates[A](lst: List[A], eq: (A, A) => Boolean = (x: A, y: A) => x == y): List[A] = |
63781 | 252 |
{ |
253 |
val result = new mutable.ListBuffer[A] |
|
254 |
@tailrec def dups(rest: List[A]): Unit = |
|
255 |
rest match { |
|
256 |
case Nil => |
|
257 |
case x :: xs => |
|
64207 | 258 |
if (!result.exists(y => eq(x, y)) && xs.exists(y => eq(x, y))) result += x |
63781 | 259 |
dups(xs) |
260 |
} |
|
261 |
dups(lst) |
|
262 |
result.toList |
|
263 |
} |
|
65761 | 264 |
|
68715 | 265 |
def replicate[A](n: Int, a: A): List[A] = |
266 |
if (n < 0) throw new IllegalArgumentException |
|
267 |
else if (n == 0) Nil |
|
268 |
else { |
|
269 |
val res = new mutable.ListBuffer[A] |
|
270 |
(1 to n).foreach(_ => res += a) |
|
271 |
res.toList |
|
272 |
} |
|
273 |
||
65761 | 274 |
|
275 |
/* proper values */ |
|
276 |
||
277 |
def proper_string(s: String): Option[String] = |
|
278 |
if (s == null || s == "") None else Some(s) |
|
279 |
||
280 |
def proper_list[A](list: List[A]): Option[List[A]] = |
|
281 |
if (list == null || list.isEmpty) None else Some(list) |
|
72214 | 282 |
|
283 |
||
284 |
/* reflection */ |
|
285 |
||
286 |
def is_subclass[A, B](a: Class[A], b: Class[B]): Boolean = |
|
287 |
{ |
|
73339 | 288 |
import scala.language.existentials |
72214 | 289 |
@tailrec def subclass(c: Class[_]): Boolean = |
290 |
{ |
|
291 |
c == b || |
|
292 |
{ |
|
293 |
val d = c.getSuperclass |
|
294 |
d != null && subclass(d) |
|
295 |
} |
|
296 |
} |
|
297 |
subclass(a) |
|
298 |
} |
|
34136 | 299 |
} |