Skip to content

Commit 7d5e87a

Browse files
committed
update handling of files with bad checksums
1 parent 02160e6 commit 7d5e87a

File tree

1 file changed

+13
-8
lines changed

1 file changed

+13
-8
lines changed

scripts/verify_download.jl

+13 -8
Original file line number | Diff line number | Diff line change
@@ -19,11 +19,11 @@ using ArgParse
1919
"--root"
2020
help = "Path to root of data directories"
2121
arg_type = String
22-
default = "/gpfs/group/ebf11/default/RISE_NEID_ebf/data"
22+
default = "/storage/group/ebf11/default/pipeline/neid_solar/data"
2323
"--input"
2424
help = "Path to inputs FITS files (fits)"
2525
arg_type = String
26-
default = "solar_L2/v1.1"
26+
default = "v1.1/L2/"
2727
"--output"
2828
help = "Path to daily CCFs (jld2)"
2929
arg_type = String
@@ -169,20 +169,24 @@ begin
169169
if checksums
170170
if in("l2filename",names(meta_df))
171171
download_success_df = manifest_df |> @join(meta_df, String(_.filename), String(_.l2filename), {_.filename, success= _.md5_download == __.l2checksum}) |> DataFrame
172-
meta_bad_checksum_df = DataFrame(download_success_df |> @filter(!_.success) |> @join(meta_df, String(_.filename), String(_.l2filename), {_.filename, meta=__}) |> DataFrame).meta
172+
#meta_bad_checksum_df = DataFrame(download_success_df |> @filter(!_.success) |> @join(meta_df, String(_.filename), String(_.l2filename), {_.filename, meta=__}) |> DataFrame).meta
173+
meta_bad_checksum_df = DataFrame(download_success_df |> @filter(!_.success) |> @join(meta_df, String(_.filename), String(_.l2filename), {_.filename, meta=__}) |> DataFrame)
173174
elseif in("l1filename",names(meta_df))
174175
download_success_df = manifest_df |> @join(meta_df, String(_.filename), String(_.l1filename), {_.filename, success= _.md5_download == __.l1checksum}) |> DataFrame
175-
meta_bad_checksum_df = DataFrame(download_success_df |> @filter(!_.success) |> @join(meta_df, String(_.filename), String(_.l1filename), {_.filename, meta=__}) |> DataFrame).meta
176+
#meta_bad_checksum_df = DataFrame(download_success_df |> @filter(!_.success) |> @join(meta_df, String(_.filename), String(_.l1filename), {_.filename, meta=__}) |> DataFrame).meta
177+
meta_bad_checksum_df = DataFrame(download_success_df |> @filter(!_.success) |> @join(meta_df, String(_.filename), String(_.l1filename), {_.filename, meta=__}) |> DataFrame)
176178
else
177179
download_success_df = manifest_df |> @join(meta_df, String(_.filename), String(_.l0filename), {_.filename, success= _.md5_download == __.l0checksum}) |> DataFrame
178-
meta_bad_checksum_df = DataFrame(download_success_df |> @filter(!_.success) |> @join(meta_df, String(_.filename), String(_.l0filename), {_.filename, meta=__}) |> DataFrame).meta
180+
#meta_bad_checksum_df = DataFrame(download_success_df |> @filter(!_.success) |> @join(meta_df, String(_.filename), String(_.l0filename), {_.filename, meta=__}) |> DataFrame).meta
181+
meta_bad_checksum_df = DataFrame(download_success_df |> @filter(!_.success) |> @join(meta_df, String(_.filename), String(_.l0filename), {_.filename, meta=__}) |> DataFrame)
179182
end
180-
if size(meta_bad_checksum_df,1) >= 1
181-
append!(need_to_redownload_df,meta_bad_checksum_df)
183+
if size(meta_bad_checksum_df.meta,1) >= 1
184+
#append!(need_to_redownload_df,meta_bad_checksum_df)
185+
append!(need_to_redownload_df,meta_bad_checksum_df.meta)
182186
suspect_files_dir = joinpath(path,suspect_dirname)
183187
isdir(suspect_files_dir) || mkdir(suspect_files_dir)
184188
for file in meta_bad_checksum_df.filename
185-
mv(file, joinpath(suspect_files_dir,file), force=true)
189+
mv(joinpath(path,file), joinpath(suspect_files_dir,file), force=true)
186190
end
187191
end
188192
end
@@ -222,6 +226,7 @@ if !args["crawl"]
222226

223227
if !args["quiet"]
224228
println("# verify_downloads.jl $input_path identified ", size(need_to_redownload_df,1), " files to download.")
229+
println(need_to_redownload_df)
225230
end
226231

227232
else

0 commit comments

Comments
 (0)