| author | wenzelm |
| Fri, 24 Jun 2022 23:31:28 +0200 | |
| changeset 75615 | 4494cd69f97f |
| parent 75613 | 1b50bcd108b7 |
| child 75616 | 986506233812 |
| permissions | -rw-r--r-- |
| 6118 | 1 |
(* Title: Pure/General/file.ML |
| 64698 | 2 |
Author: Makarius |
| 5009 | 3 |
|
| 64698 | 4 |
File-system operations. |
| 5009 | 5 |
*) |
6 |
||
7 |
(* Interface of structure File: operations on Path.T values covering path
   rendering, existence/kind tests, directory listing, reading, writing and
   file identity. *)
signature FILE = |
|
8 |
sig |
|
|
60970
e08d868ceca9
clarified File.standard_path vs. File.platform_path (like Isabelle/Scala operations);
wenzelm
parents:
59058
diff
changeset
|
9 |
(* string renderings of a path *)
val standard_path: Path.T -> string |
| 16261 | 10 |
val platform_path: Path.T -> string |
|
62549
9498623b27f0
File.bash_string operations in ML as in Scala -- exclusively for GNU bash, not perl and not user output;
wenzelm
parents:
62468
diff
changeset
|
11 |
(* renderings passed through Bash.string / Bash.strings *)
val bash_path: Path.T -> string |
| 69223 | 12 |
val bash_paths: Path.T list -> string |
| 72278 | 13 |
val bash_platform_path: Path.T -> string |
|
73314
87403fde8cc3
more direct make_directory in ML and Scala, but ssh still requires perl for Windows UNC paths (see a5dbad753552);
wenzelm
parents:
73264
diff
changeset
|
14 |
(* path resolution *)
val absolute_path: Path.T -> Path.T |
|
42003
6e45dc518ebb
replaced File.check by specific File.check_file, File.check_dir;
wenzelm
parents:
41944
diff
changeset
|
15 |
val full_path: Path.T -> Path.T -> Path.T |
| 6182 | 16 |
val tmp_path: Path.T -> Path.T |
| 17826 | 17 |
(* directory entries: tests and removal *)
val exists: Path.T -> bool |
18 |
val rm: Path.T -> unit |
|
| 40785 | 19 |
val is_dir: Path.T -> bool |
|
69300
8b6ab9989bcd
is_file/is_dir/read_dir: more uniform treatment of errors and boundary cases, notably for symlinks in ssh;
wenzelm
parents:
69223
diff
changeset
|
20 |
val is_file: Path.T -> bool |
|
42003
6e45dc518ebb
replaced File.check by specific File.check_file, File.check_dir;
wenzelm
parents:
41944
diff
changeset
|
21 |
(* checks: return the argument path, or raise an error *)
val check_dir: Path.T -> Path.T |
|
6e45dc518ebb
replaced File.check by specific File.check_file, File.check_dir;
wenzelm
parents:
41944
diff
changeset
|
22 |
val check_file: Path.T -> Path.T |
| 43848 | 23 |
(* directory content *)
val fold_dir: (string -> 'a -> 'a) -> Path.T -> 'a -> 'a |
24 |
val read_dir: Path.T -> string list |
|
| 28028 | 25 |
(* file content: reading *)
val fold_lines: (string -> 'a -> 'a) -> Path.T -> 'a -> 'a |
| 43848 | 26 |
val read_lines: Path.T -> string list |
| 6182 | 27 |
val read: Path.T -> string |
28 |
(* file content: writing and appending *)
val write: Path.T -> string -> unit |
|
29 |
val append: Path.T -> string -> unit |
|
| 16713 | 30 |
val write_list: Path.T -> string list -> unit |
31 |
val append_list: Path.T -> string list -> unit |
|
| 16603 | 32 |
(* file identity *)
val eq: Path.T * Path.T -> bool |
| 5009 | 33 |
end; |
34 |
||
35 |
structure File: FILE = |
|
36 |
struct |
|
37 |
||
|
26503
4dec4460244f
discontinued unused hooks explode_platform_path_fn, platform_path_fn, shell_path_fn;
wenzelm
parents:
26220
diff
changeset
|
38 |
(* system path representations *) |
| 6224 | 39 |
|
|
60970
e08d868ceca9
clarified File.standard_path vs. File.platform_path (like Isabelle/Scala operations);
wenzelm
parents:
59058
diff
changeset
|
40 |
(* String form of a path: expand it first, then implode the result. *)
fun standard_path path = Path.implode (Path.expand path);
| 62468 | 41 |
(* The standard_path string, converted by ML_System.platform_path. *)
fun platform_path path = ML_System.platform_path (standard_path path);
|
26980
f7f48bb9a025
ident: naive caching prevents potentially slow external invocations;
wenzelm
parents:
26946
diff
changeset
|
42 |
|
| 73264 | 43 |
(* The standard_path string, passed through Bash.string. *)
fun bash_path path = Bash.string (standard_path path);
44 |
(* The standard_path strings of all given paths, combined by Bash.strings. *)
fun bash_paths paths = Bash.strings (map standard_path paths);
|
| 6224 | 45 |
|
| 73264 | 46 |
(* The platform_path string, passed through Bash.string. *)
fun bash_platform_path path = Bash.string (platform_path path);
| 72278 | 47 |
|
| 70292 | 48 |
|
|
42003
6e45dc518ebb
replaced File.check by specific File.check_file, File.check_dir;
wenzelm
parents:
41944
diff
changeset
|
49 |
(* full_path *) |
|
6e45dc518ebb
replaced File.check by specific File.check_file, File.check_dir;
wenzelm
parents:
41944
diff
changeset
|
50 |
|
|
73314
87403fde8cc3
more direct make_directory in ML and Scala, but ssh still requires perl for Windows UNC paths (see a5dbad753552);
wenzelm
parents:
73264
diff
changeset
|
51 |
(* Expand the path.  An absolute result is returned as is; a relative one is
   appended to the current working directory reported by OS.FileSys.getDir. *)
fun absolute_path path =
  let val expanded = Path.expand path in
    if Path.is_absolute expanded then expanded
    else Path.explode (ML_System.standard_path (OS.FileSys.getDir ())) + expanded
  end;
|
87403fde8cc3
more direct make_directory in ML and Scala, but ssh still requires perl for Windows UNC paths (see a5dbad753552);
wenzelm
parents:
73264
diff
changeset
|
55 |
|
|
42003
6e45dc518ebb
replaced File.check by specific File.check_file, File.check_dir;
wenzelm
parents:
41944
diff
changeset
|
56 |
(* Resolve path against dir and make the result absolute.  A path that
   expands to the current directory is rejected with an error. *)
fun full_path dir path =
  let val expanded = Path.expand path in
    if Path.is_current expanded then error "Bad file specification"
    else absolute_path (dir + expanded)
  end;
| 5009 | 61 |
|
| 6182 | 62 |
|
63 |
(* tmp_path *) |
|
64 |
||
|
72511
460d743010bc
clarified signature: overloaded "+" for Path.append;
wenzelm
parents:
72278
diff
changeset
|
65 |
(* Place the base name of path below the path variable ISABELLE_TMP. *)
fun tmp_path path =
  let
    val tmp_dir = Path.variable "ISABELLE_TMP";
    val base = Path.base path;
  in tmp_dir + base end;
| 5009 | 66 |
|
67 |
||
|
26980
f7f48bb9a025
ident: naive caching prevents potentially slow external invocations;
wenzelm
parents:
26946
diff
changeset
|
68 |
(* directory entries *) |
|
f7f48bb9a025
ident: naive caching prevents potentially slow external invocations;
wenzelm
parents:
26946
diff
changeset
|
69 |
|
|
23861
72bb3494746f
replaced info by ident (for full identification, potentially content-based);
wenzelm
parents:
23826
diff
changeset
|
70 |
(* True iff OS.FileSys.modTime succeeds on the platform path. *)
fun exists path = can OS.FileSys.modTime (platform_path path);
| 16261 | 71 |
|
72 |
(* Remove the entry at the platform path via OS.FileSys.remove. *)
fun rm path = OS.FileSys.remove (platform_path path);
|
73 |
||
|
69300
8b6ab9989bcd
is_file/is_dir/read_dir: more uniform treatment of errors and boundary cases, notably for symlinks in ssh;
wenzelm
parents:
69223
diff
changeset
|
74 |
(* Result of OS.FileSys.isDir on the platform path; false when that test fails. *)
fun test_dir path =
  (case try OS.FileSys.isDir (platform_path path) of
    SOME result => result
  | NONE => false);
|
8b6ab9989bcd
is_file/is_dir/read_dir: more uniform treatment of errors and boundary cases, notably for symlinks in ssh;
wenzelm
parents:
69223
diff
changeset
|
75 |
(* An existing entry that tests as a directory. *)
fun is_dir path = if exists path then test_dir path else false;
|
8b6ab9989bcd
is_file/is_dir/read_dir: more uniform treatment of errors and boundary cases, notably for symlinks in ssh;
wenzelm
parents:
69223
diff
changeset
|
76 |
(* An existing entry that does not test as a directory. *)
fun is_file path = if exists path then not (test_dir path) else false;
| 40785 | 77 |
|
|
42003
6e45dc518ebb
replaced File.check by specific File.check_file, File.check_dir;
wenzelm
parents:
41944
diff
changeset
|
78 |
(* Return path unchanged if it is a directory; otherwise raise an error
   that prints the expanded path. *)
fun check_dir path =
  if not (is_dir path) then error ("No such directory: " ^ Path.print (Path.expand path))
  else path;
|
|
42003
6e45dc518ebb
replaced File.check by specific File.check_file, File.check_dir;
wenzelm
parents:
41944
diff
changeset
|
81 |
|
|
6e45dc518ebb
replaced File.check by specific File.check_file, File.check_dir;
wenzelm
parents:
41944
diff
changeset
|
82 |
(* Return path unchanged if it is a file; otherwise raise an error that
   prints the expanded path. *)
fun check_file path =
  if not (is_file path) then error ("No such file: " ^ Path.print (Path.expand path))
  else path;
|
|
42003
6e45dc518ebb
replaced File.check by specific File.check_file, File.check_dir;
wenzelm
parents:
41944
diff
changeset
|
85 |
|
| 16261 | 86 |
|
| 43848 | 87 |
(* directory content *) |
88 |
||
|
69300
8b6ab9989bcd
is_file/is_dir/read_dir: more uniform treatment of errors and boundary cases, notably for symlinks in ssh;
wenzelm
parents:
69223
diff
changeset
|
89 |
(* Fold f over the entry names of directory path, starting from a.  The
   directory is checked first (error if it is not one); entries are consumed
   in the order delivered by OS.FileSys.readDir. *)
fun fold_dir f path a =
  let
    val dir = check_dir path;
    fun drain stream acc =
      (case OS.FileSys.readDir stream of
        SOME entry => drain stream (f entry acc)
      | NONE => acc);
  in File_Stream.open_dir (fn stream => drain stream a) dir end;
| 43848 | 97 |
|
|
69427
ff2f39a221d4
clarified operations: uniform sorting of results;
wenzelm
parents:
69300
diff
changeset
|
98 |
(* All entry names of directory path, passed through sort_strings. *)
fun read_dir path = fold_dir cons path [] |> sort_strings;
| 43848 | 99 |
|
100 |
||
| 44879 | 101 |
(* |
102 |
scalable iterator: |
|
103 |
. avoid size limit of TextIO.inputAll and overhead of many TextIO.inputLine |
|
|
48911
5debc3e4fa81
tuned messages: end-of-input rarely means physical end-of-file from the past;
wenzelm
parents:
48446
diff
changeset
|
104 |
. optional terminator at end-of-input |
| 44879 | 105 |
*) |
| 75615 | 106 |
(* Fold f over the lines of file path, starting from a.  Input arrives in
   chunks from File_Stream.input; each chunk is split at newline characters.
   The text after the last newline of a chunk is kept pending and joined with
   the start of the next chunk.  At end of input (empty chunk) a non-empty
   pending text is passed to f as the final line. *)
fun fold_lines f path a =
  let
    fun is_newline c = c = #"\n";

    fun scan file =
      let
        (* read the next chunk; pending holds the unfinished line so far *)
        fun next_chunk pending acc =
          (case File_Stream.input file of
            "" => flush pending acc
          | chunk =>
              (case String.fields is_newline chunk of
                [partial] => next_chunk (Buffer.add partial pending) acc
              | first :: others =>
                  emit others (f (Buffer.content (Buffer.add first pending)) acc)))
        (* complete lines go to f; the last field becomes the new pending text *)
        and emit [partial] acc = next_chunk (Buffer.add partial Buffer.empty) acc
          | emit (line :: others) acc = emit others (f line acc)
        (* end of input: an unterminated last line still counts, an empty one does not *)
        and flush pending acc =
          (case Buffer.content pending of
            "" => acc
          | line => f line acc);
      in next_chunk Buffer.empty a end;
  in File_Stream.open_input scan path end;
118 |
||
| 43848 | 119 |
(* Lines of file path in file order: fold_lines conses them in reverse,
   so the accumulated list is reversed at the end. *)
fun read_lines path = fold_lines cons path [] |> rev;
120 |
||
| 75615 | 121 |
(* Open file path for input and apply File_Stream.input_all to the stream. *)
fun read path = File_Stream.open_input File_Stream.input_all path;
| 5009 | 122 |
|
| 28028 | 123 |
|
| 75615 | 124 |
(* write *) |
| 28028 | 125 |
|
| 75615 | 126 |
(* Open path via File_Stream.open_output and output the strings ss in order. *)
fun write_list path ss =
  let fun emit stream = File_Stream.outputs stream ss
  in File_Stream.open_output emit path end;
127 |
(* Open path via File_Stream.open_append and output the strings ss in order. *)
fun append_list path ss =
  let fun emit stream = File_Stream.outputs stream ss
  in File_Stream.open_append emit path end;
|
| 16713 | 128 |
|
129 |
(* Single-string variant of write_list. *)
fun write path txt =
  let val chunks = [txt]
  in write_list path chunks end;
|
130 |
(* Single-string variant of append_list. *)
fun append path txt =
  let val chunks = [txt]
  in append_list path chunks end;
|
| 6182 | 131 |
|
| 28028 | 132 |
|
|
56533
cd8b6d849b6a
explicit 'document_files' in session ROOT specifications;
wenzelm
parents:
48911
diff
changeset
|
133 |
(* eq *) |
| 5009 | 134 |
|
| 16603 | 135 |
(* Two paths are equal iff OS.FileSys.fileId can be obtained for both platform
   paths and the ids compare as equal; any failure to get an id yields false. *)
fun eq paths =
  let val file_id = OS.FileSys.fileId o platform_path in
    (case try (apply2 file_id) paths of
      NONE => false
    | SOME ids => is_equal (OS.FileSys.compare ids))
  end;
139 |
||
| 5009 | 140 |
end; |