| author | wenzelm | 
| Fri, 24 May 2024 16:15:27 +0200 | |
| changeset 80188 | 3956e8b6a9c9 | 
| parent 79980 | ee04ce2ac13f | 
| child 80194 | 79655411a32d | 
| permissions | -rw-r--r-- | 
| 48411 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 1 | /* Title: Pure/General/file.scala | 
| 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 2 | Author: Makarius | 
| 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 3 | |
| 64698 | 4 | File-system operations. | 
| 48411 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 5 | */ | 
| 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 6 | |
| 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 7 | package isabelle | 
| 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 8 | |
| 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 9 | |
| 79980 | 10 | import java.util.{Properties => JProperties}
 | 
| 48411 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 11 | import java.io.{BufferedWriter, OutputStreamWriter, FileOutputStream, BufferedOutputStream,
 | 
| 51504 | 12 | OutputStream, InputStream, FileInputStream, BufferedInputStream, BufferedReader, | 
| 13 | InputStreamReader, File => JFile, IOException} | |
| 73317 | 14 | import java.nio.file.{StandardOpenOption, Path => JPath, Files, SimpleFileVisitor,
 | 
| 15 | FileVisitOption, FileVisitResult} | |
| 78169 
5ad1ae8626de
minor performance tuning: avoid external process;
 wenzelm parents: 
78161diff
changeset | 16 | import java.nio.file.attribute.{BasicFileAttributes, PosixFilePermission}
 | 
| 79659 
a4118f530263
clarified signature: avoid ill-defined type java.net.URL;
 wenzelm parents: 
79045diff
changeset | 17 | import java.net.URI | 
| 50684 
12b7e0b4a66e
support File.read_gzip as well, in accordance to File.write_gzip;
 wenzelm parents: 
50203diff
changeset | 18 | import java.util.zip.{GZIPInputStream, GZIPOutputStream}
 | 
| 69293 
72a9860f8602
clarified find_files: follow links by default, e.g. relevant for "~/cronjob/log";
 wenzelm parents: 
66693diff
changeset | 19 | import java.util.EnumSet | 
| 48411 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 20 | |
| 76353 | 21 | import org.tukaani.xz | 
| 22 | import com.github.luben.zstd | |
| 76348 | 23 | |
| 48411 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 24 | import scala.collection.mutable | 
| 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 25 | |
| 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 26 | |
| 75393 | 27 | object File {
 | 
| 60992 | 28 | /* standard path (Cygwin or Posix) */ | 
| 60988 | 29 | |
| 30 | def standard_path(path: Path): String = path.expand.implode | |
| 31 | ||
| 60992 | 32 | def standard_path(platform_path: String): String = | 
| 73911 | 33 | isabelle.setup.Environment.standard_path(platform_path) | 
| 60992 | 34 | |
| 35 | def standard_path(file: JFile): String = standard_path(file.getPath) | |
| 36 | ||
| 37 | def standard_url(name: String): String = | |
| 38 |     try {
 | |
| 79044 
8cc1ae43e12e
clarified signature: avoid deprecated URL constructors;
 wenzelm parents: 
78956diff
changeset | 39 | val url = new URI(name).toURL | 
| 
8cc1ae43e12e
clarified signature: avoid deprecated URL constructors;
 wenzelm parents: 
78956diff
changeset | 40 |       if (url.getProtocol == "file" && Url.is_wellformed_file(name)) {
 | 
| 64775 | 41 | standard_path(Url.parse_file(name)) | 
| 79044 
8cc1ae43e12e
clarified signature: avoid deprecated URL constructors;
 wenzelm parents: 
78956diff
changeset | 42 | } | 
| 60992 | 43 | else name | 
| 44 | } | |
| 79045 
24d04dd5bf01
more robust exception handling (amending 8cc1ae43e12e);
 wenzelm parents: 
79044diff
changeset | 45 |     catch { case exn: Throwable if Url.is_malformed(exn) => standard_path(name) }
 | 
| 60992 | 46 | |
| 47 | ||
| 48 | /* platform path (Windows or Posix) */ | |
| 49 | ||
| 50 | def platform_path(standard_path: String): String = | |
| 73911 | 51 | isabelle.setup.Environment.platform_path(standard_path) | 
| 60992 | 52 | |
| 53 | def platform_path(path: Path): String = platform_path(standard_path(path)) | |
| 60988 | 54 | def platform_file(path: Path): JFile = new JFile(platform_path(path)) | 
| 55 | ||
| 60992 | 56 | |
| 76884 | 57 | /* symbolic path representation, e.g. "~~/src/Pure/ROOT.ML" */ | 
| 58 | ||
// Symbolic representation of a path relative to the entries of
// ISABELLE_DIRECTORIES (split at ':' and tried in reverse order).
// The first entry that equals the standard path, or is a directory prefix of
// it, determines the result; otherwise the result is path.implode.
def symbolic_path(path: Path): String = {
  val candidates =
    space_explode(':', Isabelle_System.getenv("ISABELLE_DIRECTORIES")).reverse
  val target = standard_path(path)

  // symbolic name wrt. a single directory entry; an ERROR raised while
  // processing the entry counts as "no match"
  def relative_to(dir: String): Option[String] =
    try {
      val prefix = standard_path(Path.explode(dir))
      if (target == prefix) Some(dir)
      else Library.try_unprefix(prefix + "/", target).map(rest => dir + "/" + rest)
    }
    catch { case ERROR(_) => None }

  // the view keeps the search lazy: later entries are only examined on demand
  candidates.view.flatMap(dir => relative_to(dir)).headOption.getOrElse(path.implode)
}
| 74 | ||
| 75 | ||
| 66232 | 76 | /* platform files */ | 
| 77 | ||
| 78 | def absolute(file: JFile): JFile = file.toPath.toAbsolutePath.normalize.toFile | |
| 79 | def canonical(file: JFile): JFile = file.getCanonicalFile | |
| 80 | ||
| 81 | def path(file: JFile): Path = Path.explode(standard_path(file)) | |
| 76546 | 82 | def path(java_path: JPath): Path = path(java_path.toFile) | 
| 83 | ||
| 66232 | 84 | def pwd(): Path = path(Path.current.absolute_file) | 
| 85 | ||
| 75701 | 86 | def uri(file: JFile): URI = file.toURI | 
| 87 | def uri(path: Path): URI = path.file.toURI | |
| 88 | ||
| 79659 
a4118f530263
clarified signature: avoid ill-defined type java.net.URL;
 wenzelm parents: 
79045diff
changeset | 89 | def url(file: JFile): Url = Url(uri(file)) | 
| 
a4118f530263
clarified signature: avoid ill-defined type java.net.URL;
 wenzelm parents: 
79045diff
changeset | 90 | def url(path: Path): Url = url(path.file) | 
| 75701 | 91 | |
| 66232 | 92 | |
| 75906 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 93 | /* adhoc file types */ | 
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 94 | |
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 95 |   def is_ML(s: String): Boolean = s.endsWith(".ML")
 | 
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 96 |   def is_bib(s: String): Boolean = s.endsWith(".bib")
 | 
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 97 |   def is_dll(s: String): Boolean = s.endsWith(".dll")
 | 
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 98 |   def is_exe(s: String): Boolean = s.endsWith(".exe")
 | 
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 99 |   def is_gz(s: String): Boolean = s.endsWith(".gz")
 | 
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 100 |   def is_html(s: String): Boolean = s.endsWith(".html")
 | 
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 101 |   def is_jar(s: String): Boolean = s.endsWith(".jar")
 | 
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 102 |   def is_java(s: String): Boolean = s.endsWith(".java")
 | 
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 103 |   def is_node(s: String): Boolean = s.endsWith(".node")
 | 
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 104 |   def is_pdf(s: String): Boolean = s.endsWith(".pdf")
 | 
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 105 |   def is_png(s: String): Boolean = s.endsWith(".png")
 | 
| 76540 
83de6e9ae983
clarified signature: prefer Scala functions instead of shell scripts;
 wenzelm parents: 
76533diff
changeset | 106 |   def is_tar_bz2(s: String): Boolean = s.endsWith(".tar.bz2")
 | 
| 76533 | 107 |   def is_tar_gz(s: String): Boolean = s.endsWith(".tar.gz")
 | 
| 76540 
83de6e9ae983
clarified signature: prefer Scala functions instead of shell scripts;
 wenzelm parents: 
76533diff
changeset | 108 |   def is_tgz(s: String): Boolean = s.endsWith(".tgz")
 | 
| 75906 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 109 |   def is_thy(s: String): Boolean = s.endsWith(".thy")
 | 
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 110 |   def is_xz(s: String): Boolean = s.endsWith(".xz")
 | 
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 111 |   def is_zip(s: String): Boolean = s.endsWith(".zip")
 | 
| 76348 | 112 |   def is_zst(s: String): Boolean = s.endsWith(".zst")
 | 
| 75906 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 113 | |
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 114 |   def is_backup(s: String): Boolean = s.endsWith("~") || s.endsWith(".orig")
 | 
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 115 | |
| 
2167b9e3157a
clarified signature: support for adhoc file types;
 wenzelm parents: 
75825diff
changeset | 116 | |
| 66693 | 117 | /* relative paths */ | 
| 118 | ||
// Path of `other` relative to `base`, provided that the Java path of `other`
// starts with the Java path of `base`; otherwise None.
def relative_path(base: Path, other: Path): Option[Path] = {
  val parent = base.java_path
  val child = other.java_path
  if (!child.startsWith(parent)) None
  else Some(path(parent.relativize(child).toFile))
}
| 126 | ||
| 127 | ||
| 62545 
8ebffdaf2ce2
Bash.process always uses a closed script instead of an open argument list, for extra robustness on Windows, where quoting is not well-defined;
 wenzelm parents: 
62544diff
changeset | 128 | /* bash path */ | 
| 60992 | 129 | |
| 64304 | 130 | def bash_path(path: Path): String = Bash.string(standard_path(path)) | 
| 131 | def bash_path(file: JFile): String = Bash.string(standard_path(file)) | |
| 60988 | 132 | |
| 72036 | 133 | def bash_platform_path(path: Path): String = Bash.string(platform_path(path)) | 
| 134 | ||
| 60988 | 135 | |
| 62829 
4141c2a8458b
clarified Isabelle tool wrapper: bash, Scala, no perl, no ML;
 wenzelm parents: 
62704diff
changeset | 136 | /* directory content */ | 
| 
4141c2a8458b
clarified Isabelle tool wrapper: bash, Scala, no perl, no ML;
 wenzelm parents: 
62704diff
changeset | 137 | |
// Sorted names of the entries of directory `dir`.
// Fails with an error if `dir` is not a directory; a null result of
// listFiles is treated as empty content.
def read_dir(dir: Path): List[String] = {
  if (!dir.is_dir) error("No such directory: " + dir.toString)
  Option(dir.file.listFiles) match {
    case Some(entries) => entries.toList.map(_.getName).sorted
    case None => Nil
  }
}
| 48613 
232652ac346e
clarified directory content operations (similar to ML version);
 wenzelm parents: 
48550diff
changeset | 144 | |
// The unique entry of directory `dir` that satisfies `pred`.
// Fails with an error that lists the offending entries (or " nothing") when
// there is not exactly one; `title` replaces the directory name in that
// message when it is non-empty.
def get_entry(
  dir: Path,
  pred: Path => Boolean = _ => true,
  title: String = ""
): Path = {
  val names = read_dir(dir).filter(name => pred(dir + Path.basic(name)))
  names match {
    case List(single) => dir + Path.basic(single)
    case _ =>
      val where = if (title.nonEmpty) title else dir.toString
      val found =
        if (names.isEmpty) " nothing"
        else names.sorted.map(quote).mkString(":\n  ", "\n  ", "")
      error("Bad directory content in " + where +
        "\nexpected a single entry, but found" + found)
  }
}
| 158 | ||
| 76529 | 159 | def get_file(dir: Path, title: String = ""): Path = | 
| 160 | get_entry(dir, pred = _.is_file, title = title) | |
| 161 | ||
| 162 | def get_dir(dir: Path, title: String = ""): Path = | |
| 163 | get_entry(dir, pred = _.is_dir, title = title) | |
| 164 | ||
// Collect files below `start` that satisfy `pred`.
//
// A regular file as `start` is checked on its own; a directory is traversed
// with unlimited depth via Files.walkFileTree.  Directories are only reported
// for include_dirs = true; symbolic links are only followed for
// follow_links = true.  Anything else (e.g. a missing file) yields Nil.
def find_files(
  start: JFile,
  pred: JFile => Boolean = _ => true,
  include_dirs: Boolean = false,
  follow_links: Boolean = false
): List[JFile] = {
  val found = new mutable.ListBuffer[JFile]
  def add_if_accepted(candidate: JFile): Unit =
    if (pred(candidate)) found += candidate

  if (start.isFile) add_if_accepted(start)
  else if (start.isDirectory) {
    val walk_options =
      if (follow_links) EnumSet.of(FileVisitOption.FOLLOW_LINKS)
      else EnumSet.noneOf(classOf[FileVisitOption])

    val visitor =
      new SimpleFileVisitor[JPath] {
        // directories are reported before their content
        override def preVisitDirectory(
          dir: JPath,
          attrs: BasicFileAttributes
        ): FileVisitResult = {
          if (include_dirs) add_if_accepted(dir.toFile)
          FileVisitResult.CONTINUE
        }
        override def visitFile(
          entry: JPath,
          attrs: BasicFileAttributes
        ): FileVisitResult = {
          val file = entry.toFile
          if (include_dirs || !file.isDirectory) add_if_accepted(file)
          FileVisitResult.CONTINUE
        }
      }

    Files.walkFileTree(start.toPath, walk_options, Int.MaxValue, visitor)
  }

  found.toList
}
| 
232652ac346e
clarified directory content operations (similar to ML version);
 wenzelm parents: 
48550diff
changeset | 202 | |
| 
232652ac346e
clarified directory content operations (similar to ML version);
 wenzelm parents: 
48550diff
changeset | 203 | |
| 48411 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 204 | /* read */ | 
| 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 205 | |
| 65589 
f70c617e9c26
more robust treatment of non-UTF8 text files (cf. 3ed43cfc8b14), notably old log files in ISO-8859-15;
 wenzelm parents: 
64934diff
changeset | 206 | def read(file: JFile): String = Bytes.read(file).text | 
| 48913 
f686cb016c0c
more direct File.read_bytes -- avoid cumulative copying of StringBuilder;
 wenzelm parents: 
48613diff
changeset | 207 | def read(path: Path): String = read(path.file) | 
| 
f686cb016c0c
more direct File.read_bytes -- avoid cumulative copying of StringBuilder;
 wenzelm parents: 
48613diff
changeset | 208 | |
| 50684 
12b7e0b4a66e
support File.read_gzip as well, in accordance to File.write_gzip;
 wenzelm parents: 
50203diff
changeset | 209 | |
// Read all remaining characters of `reader` into one string.
// The reader is always closed afterwards, also when reading fails with an
// exception (which is then passed on to the caller).
def read_stream(reader: BufferedReader): String = {
  val output = new StringBuilder(100)
  try {
    var c = -1
    while ({ c = reader.read; c != -1 }) output += c.toChar
  }
  finally { reader.close() }
  output.toString
}
| 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 217 | |
| 50684 
12b7e0b4a66e
support File.read_gzip as well, in accordance to File.write_gzip;
 wenzelm parents: 
50203diff
changeset | 218 | def read_stream(stream: InputStream): String = | 
| 64000 | 219 | read_stream(new BufferedReader(new InputStreamReader(stream, UTF8.charset))) | 
| 50684 
12b7e0b4a66e
support File.read_gzip as well, in accordance to File.write_gzip;
 wenzelm parents: 
50203diff
changeset | 220 | |
| 
12b7e0b4a66e
support File.read_gzip as well, in accordance to File.write_gzip;
 wenzelm parents: 
50203diff
changeset | 221 | def read_gzip(file: JFile): String = | 
| 
12b7e0b4a66e
support File.read_gzip as well, in accordance to File.write_gzip;
 wenzelm parents: 
50203diff
changeset | 222 | read_stream(new GZIPInputStream(new BufferedInputStream(new FileInputStream(file)))) | 
| 64000 | 223 | def read_gzip(path: Path): String = read_gzip(path.file) | 
| 51504 | 224 | |
| 64002 | 225 | def read_xz(file: JFile): String = | 
| 76353 | 226 | read_stream(new xz.XZInputStream(new BufferedInputStream(new FileInputStream(file)))) | 
| 64000 | 227 | def read_xz(path: Path): String = read_xz(path.file) | 
| 48411 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 228 | |
| 76348 | 229 |   def read_zstd(file: JFile): String = {
 | 
| 76349 
b4daf7577ca0
clarified Zstd.init(): avoid accidental com.github.luben.zstd.util.Native.load() operation;
 wenzelm parents: 
76348diff
changeset | 230 | Zstd.init() | 
| 76353 | 231 | read_stream(new zstd.ZstdInputStream(new BufferedInputStream(new FileInputStream(file)))) | 
| 76348 | 232 | } | 
| 233 | def read_zstd(path: Path): String = read_zstd(path.file) | |
| 234 | ||
| 48411 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 235 | |
| 50845 | 236 | /* read lines */ | 
| 237 | ||
| 75393 | 238 |   def read_line(reader: BufferedReader): Option[String] = {
 | 
| 69487 | 239 | val line = | 
| 240 |       try { reader.readLine}
 | |
| 241 |       catch { case _: IOException => null }
 | |
| 72698 | 242 | Option(line).map(Library.trim_line) | 
| 69487 | 243 | } | 
| 244 | ||
// Read lines via read_line until it returns None, passing each line to
// `progress` before it is added to the result.
// The reader is always closed afterwards, also when `progress` (or reading)
// fails with an exception.
def read_lines(reader: BufferedReader, progress: String => Unit): List[String] = {
  val result = new mutable.ListBuffer[String]
  try {
    var line = read_line(reader)
    while (line.isDefined) {
      line.foreach { s => progress(s); result += s }
      line = read_line(reader)
    }
  }
  finally { reader.close() }
  result.toList
}
| 255 | ||
| 256 | ||
| 79980 | 257 | /* read properties */ | 
| 258 | ||
// Load Java properties from the given file.
// Properties.load does not close its reader, so the reader is managed
// explicitly via `using` and closed even if loading fails.
def read_props(path: Path): JProperties = {
  val props = new JProperties
  using(Files.newBufferedReader(path.java_path))(reader => props.load(reader))
  props
}
| 264 | ||
| 265 | ||
| 48411 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 266 | /* write */ | 
| 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 267 | |
| 71534 | 268 | def writer(file: JFile): BufferedWriter = | 
| 269 | new BufferedWriter(new OutputStreamWriter(new FileOutputStream(file), UTF8.charset)) | |
| 270 | ||
// Write `text` to `file` through the output stream produced by `make_stream`
// (e.g. a compressing stream wrapped around the raw file stream), encoded
// with UTF8.charset.
def write_file(
  file: JFile,
  text: String,
  make_stream: OutputStream => OutputStream
): Unit = {
  val file_stream = new FileOutputStream(file)
  val stream =
    try { make_stream(file_stream) }
    catch {
      // the wrapper could not be created: close the raw file stream instead
      // of leaking it, then pass on the original failure
      case exn: Throwable =>
        try { file_stream.close() }
        catch { case exn2: IOException => exn.addSuppressed(exn2) }
        throw exn
    }
  using(new BufferedWriter(new OutputStreamWriter(stream, UTF8.charset)))(_.append(text))
}
| 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 279 | |
| 73574 
12b3f78dde61
clarified signature: avoid overlap of String vs. Bytes (both are CharSequence);
 wenzelm parents: 
73367diff
changeset | 280 | def write(file: JFile, text: String): Unit = write_file(file, text, s => s) | 
| 
12b3f78dde61
clarified signature: avoid overlap of String vs. Bytes (both are CharSequence);
 wenzelm parents: 
73367diff
changeset | 281 | def write(path: Path, text: String): Unit = write(path.file, text) | 
| 48411 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 282 | |
| 73574 
12b3f78dde61
clarified signature: avoid overlap of String vs. Bytes (both are CharSequence);
 wenzelm parents: 
73367diff
changeset | 283 | def write_gzip(file: JFile, text: String): Unit = | 
| 51504 | 284 | write_file(file, text, (s: OutputStream) => new GZIPOutputStream(new BufferedOutputStream(s))) | 
| 73574 
12b3f78dde61
clarified signature: avoid overlap of String vs. Bytes (both are CharSequence);
 wenzelm parents: 
73367diff
changeset | 285 | def write_gzip(path: Path, text: String): Unit = write_gzip(path.file, text) | 
| 48411 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 286 | |
| 76351 
2cee31cd92f0
generic support for XZ and Zstd compression in Isabelle/Scala;
 wenzelm parents: 
76349diff
changeset | 287 | def write_xz(file: JFile, text: String, options: Compress.Options_XZ): Unit = | 
| 76353 | 288 | File.write_file(file, text, | 
| 289 | s => new xz.XZOutputStream(new BufferedOutputStream(s), options.make)) | |
| 76351 
2cee31cd92f0
generic support for XZ and Zstd compression in Isabelle/Scala;
 wenzelm parents: 
76349diff
changeset | 290 | def write_xz(file: JFile, text: String): Unit = write_xz(file, text, Compress.Options_XZ()) | 
| 
2cee31cd92f0
generic support for XZ and Zstd compression in Isabelle/Scala;
 wenzelm parents: 
76349diff
changeset | 291 | def write_xz(path: Path, text: String, options: Compress.Options_XZ): Unit = | 
| 64002 | 292 | write_xz(path.file, text, options) | 
| 76351 
2cee31cd92f0
generic support for XZ and Zstd compression in Isabelle/Scala;
 wenzelm parents: 
76349diff
changeset | 293 | def write_xz(path: Path, text: String): Unit = write_xz(path, text, Compress.Options_XZ()) | 
| 64000 | 294 | |
| 76351 
2cee31cd92f0
generic support for XZ and Zstd compression in Isabelle/Scala;
 wenzelm parents: 
76349diff
changeset | 295 |   def write_zstd(file: JFile, text: String, options: Compress.Options_Zstd): Unit = {
 | 
| 76349 
b4daf7577ca0
clarified Zstd.init(): avoid accidental com.github.luben.zstd.util.Native.load() operation;
 wenzelm parents: 
76348diff
changeset | 296 | Zstd.init() | 
| 76353 | 297 | File.write_file(file, text, | 
| 298 | s => new zstd.ZstdOutputStream(new BufferedOutputStream(s), options.level)) | |
| 76348 | 299 | } | 
| 76351 
2cee31cd92f0
generic support for XZ and Zstd compression in Isabelle/Scala;
 wenzelm parents: 
76349diff
changeset | 300 | def write_zstd(file: JFile, text: String): Unit = | 
| 
2cee31cd92f0
generic support for XZ and Zstd compression in Isabelle/Scala;
 wenzelm parents: 
76349diff
changeset | 301 | write_zstd(file, text, Compress.Options_Zstd()) | 
| 
2cee31cd92f0
generic support for XZ and Zstd compression in Isabelle/Scala;
 wenzelm parents: 
76349diff
changeset | 302 | def write_zstd(path: Path, text: String, options: Compress.Options_Zstd): Unit = | 
| 
2cee31cd92f0
generic support for XZ and Zstd compression in Isabelle/Scala;
 wenzelm parents: 
76349diff
changeset | 303 | write_zstd(path.file, text, options) | 
| 
2cee31cd92f0
generic support for XZ and Zstd compression in Isabelle/Scala;
 wenzelm parents: 
76349diff
changeset | 304 | def write_zstd(path: Path, text: String): Unit = | 
| 
2cee31cd92f0
generic support for XZ and Zstd compression in Isabelle/Scala;
 wenzelm parents: 
76349diff
changeset | 305 | write_zstd(path, text, Compress.Options_Zstd()) | 
| 76348 | 306 | |
| 75393 | 307 |   def write_backup(path: Path, text: String): Unit = {
 | 
| 73317 | 308 | if (path.is_file) Isabelle_System.move_file(path, path.backup) | 
| 62444 | 309 | write(path, text) | 
| 53336 | 310 | } | 
| 311 | ||
| 75393 | 312 |   def write_backup2(path: Path, text: String): Unit = {
 | 
| 73317 | 313 | if (path.is_file) Isabelle_System.move_file(path, path.backup2) | 
| 62444 | 314 | write(path, text) | 
| 58610 | 315 | } | 
| 316 | ||
| 48411 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 317 | |
| 62703 | 318 | /* append */ | 
| 319 | ||
| 73574 
12b3f78dde61
clarified signature: avoid overlap of String vs. Bytes (both are CharSequence);
 wenzelm parents: 
73367diff
changeset | 320 | def append(file: JFile, text: String): Unit = | 
| 73627 | 321 | Files.write(file.toPath, UTF8.bytes(text), | 
| 62703 | 322 | StandardOpenOption.APPEND, StandardOpenOption.CREATE) | 
| 323 | ||
| 73574 
12b3f78dde61
clarified signature: avoid overlap of String vs. Bytes (both are CharSequence);
 wenzelm parents: 
73367diff
changeset | 324 | def append(path: Path, text: String): Unit = append(path.file, text) | 
| 62703 | 325 | |
| 326 | ||
| 75206 | 327 | /* change */ | 
| 328 | ||
| 75393 | 329 | def change( | 
| 330 | path: Path, | |
| 331 | init: Boolean = false, | |
| 332 | strict: Boolean = false | |
| 333 |   )(f: String => String): Unit = {
 | |
| 75208 | 334 | if (!path.is_file && init) write(path, "") | 
| 75206 | 335 | val x = read(path) | 
| 336 | val y = f(x) | |
| 337 | if (x != y) write(path, y) | |
| 75213 | 338 |     else if (strict) error("Unchanged file: " + path)
 | 
| 75206 | 339 | } | 
| 340 | ||
| 75213 | 341 | def change_lines(path: Path, init: Boolean = false, strict: Boolean = false)( | 
| 342 | f: List[String] => List[String]): Unit = | |
| 343 | change(path, init = init, strict = strict)(text => cat_lines(f(split_lines(text)))) | |
| 75206 | 344 | |
| 345 | ||
| 64213 | 346 | /* eq */ | 
| 48411 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 347 | |
| 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 348 | def eq(file1: JFile, file2: JFile): Boolean = | 
| 73318 | 349 |     try { Files.isSameFile(file1.toPath, file2.toPath) }
 | 
| 49673 
2a088cff1e7b
more robust File.eq, and thus File.copy of "~~/lib/logo/isabelle.gif";
 wenzelm parents: 
49610diff
changeset | 350 |     catch { case ERROR(_) => false }
 | 
| 48411 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 351 | |
| 64213 | 352 | def eq(path1: Path, path2: Path): Boolean = eq(path1.file, path2.file) | 
| 353 | ||
| 354 | ||
| 64934 | 355 | /* eq_content */ | 
| 356 | ||
| 357 | def eq_content(file1: JFile, file2: JFile): Boolean = | |
| 358 | if (eq(file1, file2)) true | |
| 359 | else if (file1.length != file2.length) false | |
| 360 | else Bytes.read(file1) == Bytes.read(file2) | |
| 361 | ||
| 362 | def eq_content(path1: Path, path2: Path): Boolean = eq_content(path1.file, path2.file) | |
| 363 | ||
| 364 | ||
| 69405 
22428643351f
more direct File.executable operation: avoid external process (on Unix);
 wenzelm parents: 
69402diff
changeset | 365 | /* permissions */ | 
| 
22428643351f
more direct File.executable operation: avoid external process (on Unix);
 wenzelm parents: 
69402diff
changeset | 366 | |
| 78169 
5ad1ae8626de
minor performance tuning: avoid external process;
 wenzelm parents: 
78161diff
// Permission bits of "group" and "others" (read, write, execute each);
// owner permissions are not part of this list.
private val restrict_perms: List[PosixFilePermission] = {
  import PosixFilePermission._
  List(
    GROUP_READ, GROUP_WRITE, GROUP_EXECUTE,
    OTHERS_READ, OTHERS_WRITE, OTHERS_EXECUTE)
}
| 
5ad1ae8626de
minor performance tuning: avoid external process;
 wenzelm parents: 
78161diff
changeset | 375 | |
| 
5ad1ae8626de
minor performance tuning: avoid external process;
 wenzelm parents: 
78161diff
// Remove all "group" and "others" permissions from the given path.
// On Windows this goes through Isabelle_System.chmod; otherwise the POSIX
// permission set is edited directly and written back only if it has changed.
def restrict(path: Path): Unit =
  if (!Platform.is_windows) {
    val perms = Files.getPosixFilePermissions(path.java_path)
    // Set.remove reports whether the element was present; the accumulator is
    // the right operand of || so that every permission is actually removed
    val changed =
      restrict_perms.foldLeft(false) { case (acc, perm) => perms.remove(perm) || acc }
    if (changed) Files.setPosixFilePermissions(path.java_path, perms)
  }
  else Isabelle_System.chmod("g-rwx,o-rwx", path)
| 78161 | 387 | |
// Test whether the given path is executable: via JFile.canExecute in general,
// via an external "test -x" bash command on Windows.
def is_executable(path: Path): Boolean =
  if (!Platform.is_windows) path.file.canExecute
  else {
    val script = "test -x " + bash_path(path)
    // NOTE(review): if `check` raises an error on a non-zero return code, a
    // non-executable file yields an exception here instead of `false` --
    // confirm against the definition of the bash process result.
    Isabelle_System.bash(script).check.ok
  }
| 392 | ||
| 78298 
3b0f8f1010f2
clarified signature, with subtle change of semantics (amending 8b5a2e4b16d4);
 wenzelm parents: 
78243diff
// Set the executable flag of the given path for all users, or clear it if
// `reset` is true. On Windows this goes through Isabelle_System.chmod.
def set_executable(path: Path, reset: Boolean = false): Unit = {
  if (Platform.is_windows) {
    val mode = if (reset) "a-x" else "a+x"
    Isabelle_System.chmod(mode, path)
  }
  else {
    val executable = !reset
    // second argument `false`: not restricted to the owner; the Boolean
    // result of setExecutable is ignored
    path.file.setExecutable(executable, false)
  }
}
| 74811 | 397 | |
| 398 | ||
| 399 | /* content */ | |
| 400 | ||
// Constructors for file content relative to a path: raw bytes, a string
// (converted via Bytes), or an XML body (kept unrendered as Content_XML).
def content(path: Path, content: Bytes): Content = {
  new Content(path, content)
}
def content(path: Path, content: String): Content = {
  val bytes = Bytes(content)
  new Content(path, bytes)
}
def content(path: Path, content: XML.Body): Content_XML = {
  new Content_XML(path, content)
}
| 74811 | 404 | |
// Byte content associated with a path; printed as its path.
final class Content private[File](val path: Path, val content: Bytes) {
  override def toString: String = path.toString

  // Write the content to `dir + path` via the given SSH system (local by
  // default), after making the directory of the expanded target path.
  def write(dir: Path, ssh: SSH.System = SSH.Local): Unit = {
    val target = dir + path
    val target_dir = ssh.expand_path(target).dir
    ssh.make_directory(target_dir)
    ssh.write_bytes(target, content)
  }
}
| 414 | ||
// XML body associated with a path; printed as its path.
final class Content_XML private[File](val path: Path, val content: XML.Body) {
  override def toString: String = path.toString

  // Render the XML body with the given function and wrap the resulting
  // string (as Bytes) into a Content for the same path.
  def output(out: XML.Body => String): Content = {
    val text = out(content)
    new Content(path, Bytes(text))
  }
}
| 77109 
e3a2b3536030
prefer typed bytes count, but retain toString of original Long for robustness of Java/Scala string composition;
 wenzelm parents: 
76884diff
changeset | 420 | |
| 
e3a2b3536030
prefer typed bytes count, but retain toString of original Long for robustness of Java/Scala string composition;
 wenzelm parents: 
76884diff
changeset | 421 | |
| 78956 | 422 | /* strict file size */ | 
| 77109 
e3a2b3536030
prefer typed bytes count, but retain toString of original Long for robustness of Java/Scala string composition;
 wenzelm parents: 
76884diff
changeset | 423 | |
// Length of the file at the given path, after applying path.check_file
// (presumably this rejects anything that is not a regular file -- confirm).
def size(path: Path): Long = {
  val file = path.check_file.file
  file.length
}
// File size of the given path (see size), wrapped as a typed Space value.
def space(path: Path): Space = {
  val bytes = size(path)
  Space.bytes(bytes)
}
| 48411 
5b3440850d36
more abstract file system operations in Scala, corresponding to ML version;
 wenzelm parents: diff
changeset | 426 | } |