author | wenzelm |
Wed, 11 Aug 2010 18:41:06 +0200 | |
changeset 38353 | d98baa2cf589 |
parent 37740 | 9bb4a74cff4e |
child 40425 | c9b5e0fcee31 |
permissions | -rw-r--r-- |
35942
667fd8553cd5
use internal SHA1 digest implementation for generating hash keys
boehmes
parents:
35941
diff
changeset
|
1 |
(* Title: Tools/cache_io.ML |
35151 | 2 |
Author: Sascha Boehme, TU Muenchen |
3 |
||
4 |
Cache for output of external processes. |
|
5 |
*) |
|
6 |
||
7 |
(* Interface of the output cache: temporary files and directories, running
   a command on a string input, and a file-backed cache of command output
   keyed by a digest of the input. *)
signature CACHE_IO =
sig
  (* temporary resources; removal is attempted once the function is done *)
  val with_tmp_file: string -> (Path.T -> 'a) -> 'a
  val with_tmp_dir: string -> (Path.T -> 'a) -> 'a

  (* run a command built from an input path and an output path; the result
     pairs the lines of the output file with the lines printed by the
     command itself *)
  val run: (Path.T -> Path.T -> string) -> string -> string list * string list

  (* persistent cache *)
  type cache
  val make: Path.T -> cache
  val cache_path_of: cache -> Path.T

  (* the second component of the result is the key computed for the input *)
  val lookup: cache -> string -> (string list * string list) option * string

  (* run unconditionally and store the result under the given key *)
  val run_and_cache: cache -> string -> (Path.T -> Path.T -> string) ->
    string -> string list * string list

  (* answer from the cache if possible, otherwise run and store *)
  val run_cached: cache -> (Path.T -> Path.T -> string) -> string ->
    string list * string list
end
|
22 |
||
23 |
structure Cache_IO : CACHE_IO = |
|
24 |
struct |
|
25 |
||
36086
8e5454761f26
simplified Cache_IO interface (input is just a string and not already stored in a file)
boehmes
parents:
35942
diff
changeset
|
26 |
(* name prefix shared by the temporary input/output files created by run *)
val cache_io_prefix = "cache-io-"
8e5454761f26
simplified Cache_IO interface (input is just a string and not already stored in a file)
boehmes
parents:
35942
diff
changeset
|
27 |
|
35151 | 28 |
(* Apply f to a temporary path whose name is the given name followed by a
   serial string.  Afterwards an attempt is made to remove the file (a
   failing removal is ignored), then the result of f is returned or its
   exception is raised again. *)
fun with_tmp_file name f =
  let
    val tmp_name = name ^ serial_string ()
    val tmp = File.tmp_path (Path.explode tmp_name)
    val outcome = Exn.capture f tmp
    val _ = try File.rm tmp
  in
    Exn.release outcome
  end
|
34 |
||
37740 | 35 |
(* Create a temporary directory whose name is the given name followed by a
   serial string, and apply f to its path.  Afterwards an attempt is made
   to remove the whole tree (a failing removal is ignored), then the result
   of f is returned or its exception is raised again. *)
fun with_tmp_dir name f =
  let
    val dir_name = name ^ serial_string ()
    val dir = File.tmp_path (Path.explode dir_name)
    val _ = File.mkdir dir
    val outcome = Exn.capture f dir
    val _ = try File.rm_tree dir
  in
    Exn.release outcome
  end
|
42 |
||
36086
8e5454761f26
simplified Cache_IO interface (input is just a string and not already stored in a file)
boehmes
parents:
35942
diff
changeset
|
43 |
(* Run an external command on the input string str.

   Two temporary files are used: str is written to the first one, and
   make_cmd receives both paths to build the shell command line.  The
   result is (lines of the second file, lines of the text returned by
   bash_output).  If the second file cannot be read, its line list is
   empty.  The second component returned by bash_output is discarded. *)
fun run make_cmd str =
  let
    fun exec in_path out_path =
      let
        val _ = File.write in_path str
        val (cmd_output, _) = bash_output (make_cmd in_path out_path)
        val file_lines =
          (case try (rev o File.fold_lines cons out_path) [] of
            SOME lines => lines
          | NONE => [])
      in
        (file_lines, split_lines cmd_output)
      end
  in
    with_tmp_file cache_io_prefix (fn in_path =>
      with_tmp_file cache_io_prefix (fn out_path => exec in_path out_path))
  end
35151 | 51 |
|
52 |
||
53 |
||
54 |
abstype cache = Cache of { |
|
55 |
path: Path.T, |
|
56 |
table: (int * (int * int * int) Symtab.table) Synchronized.var } |
|
57 |
with |
|
58 |
||
59 |
||
60 |
(* path of the file that backs the cache *)
fun cache_path_of (Cache fields) = #path fields
|
61 |
||
62 |
||
63 |
(* Build the in-memory index of an existing cache file.

   The file is a sequence of records.  Each record starts with a header
   line "key len1 len2" and is followed by len1 + len2 payload lines.  The
   fold tracks the current line number and the line number of the next
   expected header; all other lines are skipped.  The result is the number
   of the line following the last one read, paired with a table that maps
   each key to (first payload line, len1, len2).  A malformed header
   raises an error that names the cache file. *)
fun load cache_path =
  let
    fun corrupted () =
      error ("Cache IO: corrupted cache file: " ^ File.shell_path cache_path)

    (* the whole string must be consumed by read_int *)
    fun number s =
      (case read_int (explode s) of
        (n, []) => n
      | _ => corrupted ())

    fun header line =
      (case space_explode " " line of
        [key, n1, n2] => (key, number n1, number n2)
      | _ => corrupted ())

    fun step line ((cur, next_header), tab) =
      if cur <> next_header then ((cur + 1, next_header), tab)
      else
        let
          val (key, n1, n2) = header line
          val entry = (key, (cur + 1, n1, n2))
        in
          ((cur + 1, next_header + n1 + n2 + 1), Symtab.update entry tab)
        end

    val ((next_line, _), tab) =
      File.fold_lines step cache_path ((1, 1), Symtab.empty)
  in
    (next_line, tab)
  end
|
85 |
||
86 |
(* Create a cache backed by the given file.  An existing file is indexed
   via load; otherwise the cache starts empty with line counter 1.  The
   synchronized variable is named after the path. *)
fun make path =
  let
    val initial =
      (case File.exists path of
        true => load path
      | false => (1, Symtab.empty))
    val var_name = Path.implode path
  in
    Cache {path = path, table = Synchronized.var var_name initial}
  end
|
89 |
||
90 |
||
91 |
(* Read one cached record back from the cache file.

   The argument (p, len1, len2) is a table entry: p is the line number of
   the first payload line, len1 and len2 are the lengths of the two line
   groups, which are stored one after the other (run_and_cache writes
   header :: out @ err).  Hence the first group occupies lines
   p .. p+len1-1 and the second group lines p+len1 .. p+len1+len2-1.

   The upper bound of the second group used to be p + len2, which dropped
   the second group entirely whenever len2 <= len1 and truncated it
   otherwise; it is now p + len1 + len2.

   Lines are collected in reverse and reversed at the end.  Once the record
   has been passed, the counter is no longer advanced and the remaining
   lines are ignored. *)
fun load_cached_result cache_path (p, len1, len2) =
  let
    val snd_start = p + len1        (* first line of the second group *)
    val stop = snd_start + len2     (* first line after the record *)

    fun load line (i, xsp) =
      if i < p then (i+1, xsp)
      else if i < snd_start then (i+1, apfst (cons line) xsp)
      else if i < stop then (i+1, apsnd (cons line) xsp)
      else (i, xsp)
  in pairself rev (snd (File.fold_lines load cache_path (1, ([], [])))) end
|
99 |
||
36086
8e5454761f26
simplified Cache_IO interface (input is just a string and not already stored in a file)
boehmes
parents:
35942
diff
changeset
|
100 |
|
8e5454761f26
simplified Cache_IO interface (input is just a string and not already stored in a file)
boehmes
parents:
35942
diff
changeset
|
101 |
(* Look up the cached result for the input string str.  The key is the
   SHA1 digest of str; it is returned in either case so that the caller
   can reuse it.  On a hit the stored lines are read from the cache file. *)
fun lookup (Cache {path = cache_path, table}) str =
  let
    val key = SHA1.digest str
    val (_, entries) = Synchronized.value table
    val cached =
      (case Symtab.lookup entries key of
        SOME pos => SOME (load_cached_result cache_path pos)
      | NONE => NONE)
  in
    (cached, key)
  end
108 |
||
36086
8e5454761f26
simplified Cache_IO interface (input is just a string and not already stored in a file)
boehmes
parents:
35942
diff
changeset
|
109 |
|
8e5454761f26
simplified Cache_IO interface (input is just a string and not already stored in a file)
boehmes
parents:
35942
diff
changeset
|
110 |
(* Run the command on str and store its result under the given key.

   The record appended to the cache file consists of the header line
   "key len1 len2" followed by the lines of the first and then of the
   second result component.  File and table are updated inside
   Synchronized.change; nothing is written when the key is already present
   in the table.  The result of the run is returned in either case. *)
fun run_and_cache (Cache {path = cache_path, table}) key make_cmd str =
  let
    val result = run make_cmd str
    val (out_lines, err_lines) = result
    val n_out = length out_lines
    val n_err = length err_lines

    val header = key ^ " " ^ string_of_int n_out ^ " " ^ string_of_int n_err
    val record = map (suffix "\n") (header :: out_lines @ err_lines)

    (* next_line is the line number at which the new header will be placed *)
    fun store (state as (next_line, tab)) =
      if Symtab.defined tab key then state
      else
        let
          val _ = File.append_list cache_path record
          val entry = (key, (next_line + 1, n_out, n_err))
        in
          (next_line + n_out + n_err + 1, Symtab.update entry tab)
        end

    val _ = Synchronized.change table store
  in
    result
  end
8e5454761f26
simplified Cache_IO interface (input is just a string and not already stored in a file)
boehmes
parents:
35942
diff
changeset
|
123 |
|
8e5454761f26
simplified Cache_IO interface (input is just a string and not already stored in a file)
boehmes
parents:
35942
diff
changeset
|
124 |
|
8e5454761f26
simplified Cache_IO interface (input is just a string and not already stored in a file)
boehmes
parents:
35942
diff
changeset
|
125 |
(* Return the cached result for str if there is one; otherwise run the
   command and store its result under the key computed by lookup. *)
fun run_cached cache make_cmd str =
  let
    val (cached, key) = lookup cache str
  in
    (case cached of
      SOME output => output
    | NONE => run_and_cache cache key make_cmd str)
  end
35151 | 129 |
|
130 |
end |
|
131 |
end |