|
1 | 1 | # This file is a part of ParallelProcessingTools.jl, licensed under the MIT License (MIT).
|
2 | 2 |
|
| 3 | +""" |
| 4 | + ParallelProcessingTools.split_basename_ext(file_basename_with_ext::AbstractString) |
| 5 | +
|
| 6 | +Splits a filename (given without its directory path) into a basename without |
| 7 | +file extension and the file extension. Returns a tuple `(basename_noext, ext)`. |
| 8 | +
|
| 9 | +Example: |
| 10 | +
|
| 11 | +``` |
| 12 | +ParallelProcessingTools.split_basename_ext("myfile.tar.gz") == ("myfile", ".tar.gz") |
| 13 | +``` |
| 14 | +""" |
| 15 | +function split_basename_ext(bn_ext::AbstractString) |
| 16 | + ext_startpos = findfirst('.', bn_ext) |
| 17 | + bn, ext = isnothing(ext_startpos) ? (bn_ext, "") : (bn_ext[1:ext_startpos-1], bn_ext[ext_startpos:end]) |
| 18 | + return bn, ext |
| 19 | +end |
| 20 | + |
3 | 21 |
|
4 | 22 | """
|
5 | 23 | ParallelProcessingTools.tmp_filename(fname::AbstractString)
|
| 24 | + ParallelProcessingTools.tmp_filename(fname::AbstractString, dir::AbstractString) |
6 | 25 |
|
7 |
| -Returns a temporary filename, based on `fname`, in the same directory. |
| 26 | +Returns a temporary filename, based on `fname`. |
8 | 27 |
|
9 |
| -Does *not* create the temporary file. |
| 28 | +By default, the temporary filename is in the same directory as `fname`, |
| 29 | +otherwise in `dir`. |
| 30 | +
|
| 31 | +Does *not* create the temporary file, only returns the filename (including |
| 32 | +directory path). |
10 | 33 | """
|
11 |
| -function tmp_filename(fname::AbstractString) |
12 |
| - d, fn, ext = _split_dir_fn_ext(fname) |
| 34 | +function tmp_filename end |
| 35 | + |
| 36 | +function tmp_filename(fname::AbstractString, dir::AbstractString) |
| 37 | + bn_ext = basename(fname) |
| 38 | + bn, ext = split_basename_ext(bn_ext) |
13 | 39 | tag = _rand_fname_tag()
|
14 |
| - joinpath(d, "$(fn)_$(tag)$(ext)") |
15 |
| -end |
16 |
| - |
17 |
| -function _split_dir_fn_ext(fname::AbstractString) |
18 |
| - d = dirname(fname) |
19 |
| - f = basename(fname) |
20 |
| - ext_startpos = findfirst('.', f) |
21 |
| - fn, ext = isnothing(ext_startpos) ? (f, "") : (f[1:ext_startpos-1], f[ext_startpos:end]) |
22 |
| - return d, fn, ext |
| 40 | + joinpath(dir, "$(bn)_$(tag)$(ext)") |
23 | 41 | end
|
24 | 42 |
|
| 43 | +tmp_filename(fname::AbstractString) = tmp_filename(fname, dirname(fname)) |
| 44 | + |
25 | 45 | _rand_fname_tag() = String(rand(b"0123456789abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ", 8))
|
26 | 46 |
|
27 | 47 |
|
28 | 48 | """
|
29 | 49 | function create_files(
|
30 | 50 | body, filenames::AbstractString...;
|
31 | 51 | create_dirs::Bool = true, overwrite::Bool = true, delete_on_error::Bool=true
|
| 52 | + use_cache::Bool = true, cache_dir::AbstractString = tempdir() |
32 | 53 | )
|
33 | 54 |
|
34 | 55 | Creates `filenames` in an atomic fashion.
|
35 | 56 |
|
36 |
| -Creates temporary files in the same directories as `filenames`, then |
| 57 | +Creates temporary files, then |
37 | 58 | calls `body(temporary_filenames...)`. If `body` returns successfully,
|
38 | 59 | the files `temporary_filenames` are renamed to `filenames`. If `body` throws
|
39 | 60 | an exception, the temporary files are either deleted (if `delete_on_error` is
|
40 | 61 | `true`) or left in place (e.g. for debugging purposes).
|
41 | 62 |
|
| 63 | +If `create_dirs` is `true`, the `temporary_filenames` are created in |
| 64 | +`cache_dir` and then atomically moved to `filenames`, otherwise, they are |
| 65 | +created next to `filenames` (in the same directories). |
| 66 | +
|
42 | 67 | If `create_dirs` is `true`, directories are created if necessary.
|
43 | 68 |
|
44 | 69 | If all of files already exist and `overwrite` is `false`, takes no action
|
45 | 70 | (or, if the file is created by other code running in parallel, while `body` is
|
46 | 71 | running, does not overwrite it).
|
47 | 72 |
|
| 73 | +If `verbose` is `true`, uses log-level `Logging.Info` to log file creation, |
| 74 | +otherwise `Logging.Debug`. |
| 75 | +
|
48 | 76 | Throws an error if only some of the files exist and `overwrite` is `false`.
|
49 | 77 |
|
50 | 78 | Returns `nothing`.
|
|
59 | 87 | ```
|
60 | 88 | """
|
61 | 89 | function create_files(
|
62 |
| - body, filenames::AbstractString...; |
63 |
| - create_dirs::Bool = true, overwrite::Bool = true, delete_on_error::Bool=true |
| 90 | + @nospecialize(body), @nospecialize(filenames::AbstractString...); |
| 91 | + create_dirs::Bool = true, overwrite::Bool = true, delete_on_error::Bool=true, |
| 92 | + use_cache::Bool = true, cache_dir::AbstractString = tempdir(), |
| 93 | + verbose::Bool = true |
64 | 94 | )
|
65 |
| - tmp_filenames = String[] |
66 |
| - completed_filenames = String[] |
| 95 | + loglevel = verbose ? Info : Debug |
| 96 | + |
| 97 | + target_fnames = String[filenames...] # Fix type |
| 98 | + staging_fnames = String[] |
| 99 | + writeto_fnames = String[] |
| 100 | + completed_fnames = String[] |
67 | 101 |
|
68 |
| - pre_existing = isfile.(filenames) |
| 102 | + pre_existing = isfile.(target_fnames) |
69 | 103 | if any(pre_existing)
|
70 | 104 | if all(pre_existing)
|
71 | 105 | if !overwrite
|
72 |
| - @info "Files $filenames already exist, nothing to do." |
| 106 | + @logmsg loglevel "Files $target_fnames already exist, nothing to do." |
73 | 107 | return nothing
|
74 | 108 | end
|
75 | 109 | else
|
76 |
| - !overwrite && throw(ErrorException("Only some of $filenames exist but not allowed to overwrite")) |
| 110 | + !overwrite && throw(ErrorException("Only some of $target_fnames exist but not allowed to overwrite")) |
77 | 111 | end
|
78 | 112 | end
|
79 | 113 |
|
80 |
| - dirs = dirname.(filenames) |
81 |
| - for dir in dirs |
82 |
| - if !isdir(dir) && create_dirs |
83 |
| - mkpath(dir) |
84 |
| - @info "Created directory $dir." |
| 114 | + dirs = dirname.(target_fnames) |
| 115 | + if create_dirs |
| 116 | + for dir in dirs |
| 117 | + if !isdir(dir) && create_dirs |
| 118 | + mkpath(dir) |
| 119 | + @logmsg loglevel "Created directory $dir." |
| 120 | + end |
| 121 | + end |
| 122 | + |
| 123 | + if use_cache && !isdir(cache_dir) |
| 124 | + mkpath(cache_dir) |
| 125 | + @logmsg loglevel "Created cache directory $cache_dir." |
85 | 126 | end
|
86 | 127 | end
|
87 | 128 |
|
88 | 129 | try
|
89 |
| - for fname in filenames |
90 |
| - tmp_fname = tmp_filename(fname) |
91 |
| - @assert !isfile(tmp_fname) |
92 |
| - push!(tmp_filenames, tmp_fname) |
93 |
| - end |
| 130 | + staging_fnames = tmp_filename.(target_fnames) |
| 131 | + @assert !any(isfile, staging_fnames) |
| 132 | + |
| 133 | + writeto_fnames = use_cache ? tmp_filename.(target_fnames, Ref(cache_dir)) : staging_fnames |
| 134 | + @assert !any(isfile, writeto_fnames) |
94 | 135 |
|
95 |
| - body(tmp_filenames...) |
| 136 | + @debug "Creating intermediate files $writeto_fnames." |
| 137 | + body(writeto_fnames...) |
96 | 138 |
|
97 |
| - post_body_existing = isfile.(filenames) |
| 139 | + post_body_existing = isfile.(target_fnames) |
98 | 140 | if any(post_body_existing)
|
99 | 141 | if all(post_body_existing)
|
100 | 142 | if !overwrite
|
101 |
| - @info "Files $filenames already exist, won't replace." |
| 143 | + @logmsg loglevel "Files $target_fnames already exist, won't replace." |
102 | 144 | return nothing
|
103 | 145 | end
|
104 | 146 | else
|
105 |
| - !overwrite && throw(ErrorException("Only some of $filenames exist but not allowed to replace files")) |
| 147 | + !overwrite && throw(ErrorException("Only some of $target_fnames exist but not allowed to replace files")) |
106 | 148 | end
|
107 | 149 | end
|
108 |
| - |
| 150 | + |
109 | 151 | try
|
110 |
| - for (tmp_fname, fname) in zip(tmp_filenames, filenames) |
111 |
| - mv(tmp_fname, fname; force=true) |
112 |
| - @assert isfile(fname) |
113 |
| - push!(completed_filenames, fname) |
| 152 | + if use_cache |
| 153 | + for (writeto_fn, staging_fn) in zip(writeto_fnames, staging_fnames) |
| 154 | + @assert writeto_fn != staging_fn |
| 155 | + @debug "Moving file \"$writeto_fn\" to \"$staging_fn\"." |
| 156 | + isfile(writeto_fn) || error("Expected file \"$writeto_fn\" to exist, but it doesn't.") |
| 157 | + mv(writeto_fn, staging_fn; force=true) |
| 158 | + isfile(staging_fn) || error("Tried to move file \"$writeto_fn\" to \"$staging_fn\", but \"$staging_fn\" doesn't exist.") |
| 159 | + end |
| 160 | + end |
| 161 | + for (staging_fn, target_fn) in zip(staging_fnames, target_fnames) |
| 162 | + @assert staging_fn != target_fn |
| 163 | + @debug "Renaming file \"$staging_fn\" to \"$target_fn\"." |
| 164 | + isfile(staging_fn) || error("Expected file \"$staging_fn\" to exist, but it doesn't.") |
| 165 | + mv(staging_fn, target_fn; force=true) |
| 166 | + isfile(target_fn) || error("Tried to rename file \"$staging_fn\" to \"$target_fn\", but \"$target_fn\" doesn't exist.") |
| 167 | + push!(completed_fnames, target_fn) |
114 | 168 | end
|
115 |
| - @info "Successfully created files $filenames." |
| 169 | + @logmsg loglevel "Created files $target_fnames." |
116 | 170 | catch
|
117 |
| - if !isempty(completed_filenames) |
118 |
| - @error "Failed to rename some temporary files to final filenames, removing $completed_filenames" |
119 |
| - for fname in completed_filenames |
| 171 | + if !isempty(completed_fnames) |
| 172 | + @error "Failed to rename some temporary files to final filenames, removing $completed_fnames" |
| 173 | + for fname in completed_fnames |
120 | 174 | rm(fname; force=true)
|
121 | 175 | end
|
122 | 176 | end
|
123 | 177 | rethrow()
|
124 | 178 | end
|
125 | 179 |
|
126 |
| - @assert all(fn -> !isfile(fn), tmp_filenames) |
| 180 | + @assert all(fn -> !isfile(fn), staging_fnames) |
127 | 181 | finally
|
128 | 182 | if delete_on_error
|
129 |
| - for tmp_fname in tmp_filenames |
130 |
| - isfile(tmp_fname) && rm(tmp_fname; force=true); |
| 183 | + for writeto_fn in writeto_fnames |
| 184 | + isfile(writeto_fn) && rm(writeto_fn; force=true); |
| 185 | + end |
| 186 | + for staging_fn in staging_fnames |
| 187 | + isfile(staging_fn) && rm(staging_fn; force=true); |
131 | 188 | end
|
132 | 189 | end
|
133 | 190 | end
|
|
0 commit comments