From: "Fabian Grünbichler" <f.gruenbichler@proxmox.com>
To: pbs-devel@lists.proxmox.com
Subject: [pbs-devel] [PATCH proxmox-backup 1/3] debug: recover: allow ignoring missing/corrupt chunks
Date: Mon, 23 May 2022 16:11:33 +0200 [thread overview]
Message-ID: <20220523141135.921321-1-f.gruenbichler@proxmox.com> (raw)
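With the new optional flags, missing and/or corrupt chunks are no longer fatal: a warning is printed and each such chunk is replaced with a chunk of zero bytes of the size recorded in the index, to allow partial recovery.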
Signed-off-by: Fabian Grünbichler <f.gruenbichler@proxmox.com>
---
src/bin/proxmox_backup_debug/recover.rs | 98 +++++++++++++++++++++----
1 file changed, 84 insertions(+), 14 deletions(-)
diff --git a/src/bin/proxmox_backup_debug/recover.rs b/src/bin/proxmox_backup_debug/recover.rs
index b118a71c..9c4aed3d 100644
--- a/src/bin/proxmox_backup_debug/recover.rs
+++ b/src/bin/proxmox_backup_debug/recover.rs
@@ -38,7 +38,19 @@ use pbs_tools::crypt_config::CryptConfig;
type: Boolean,
optional: true,
default: false,
- }
+ },
+ "ignore-missing-chunks": {
+ description: "If a chunk is missing, warn and write 0-bytes instead to attempt partial recovery.",
+ type: Boolean,
+ optional: true,
+ default: false,
+ },
+ "ignore-corrupt-chunks": {
+ description: "If a chunk is corrupt, warn and write 0-bytes instead to attempt partial recovery.",
+ type: Boolean,
+ optional: true,
+ default: false,
+ },
}
}
)]
@@ -49,6 +61,8 @@ fn recover_index(
chunks: String,
keyfile: Option<String>,
skip_crc: bool,
+ ignore_missing_chunks: bool,
+ ignore_corrupt_chunks: bool,
_param: Value,
) -> Result<(), Error> {
let file_path = Path::new(&file);
@@ -89,22 +103,78 @@ fn recover_index(
let digest_str = hex::encode(chunk_digest);
let digest_prefix = &digest_str[0..4];
let chunk_path = chunks_path.join(digest_prefix).join(digest_str);
- let mut chunk_file = std::fs::File::open(&chunk_path)
- .map_err(|e| format_err!("could not open chunk file - {}", e))?;
- data.clear();
- chunk_file.read_to_end(&mut data)?;
- let chunk_blob = DataBlob::from_raw(data.clone())?;
+ let create_zero_chunk = |msg: String| -> Result<(DataBlob, Option<&[u8; 32]>), Error> {
+ let info = index
+ .chunk_info(pos)
+ .ok_or_else(|| format_err!("Couldn't read chunk info from index at {pos}"))?;
+ let size = info.size();
- if !skip_crc {
- chunk_blob.verify_crc()?;
- }
+ eprintln!("WARN: chunk {:?} {}", chunk_path, msg);
+ eprintln!("WARN: replacing output file {:?} with '\\0'", info.range,);
+
+ Ok((
+ DataBlob::encode(&vec![0; size as usize], crypt_conf_opt.as_ref(), true)?,
+ None,
+ ))
+ };
+
+ let (chunk_blob, chunk_digest) = match std::fs::File::open(&chunk_path) {
+ Ok(mut chunk_file) => {
+ data.clear();
+ chunk_file.read_to_end(&mut data)?;
+
+ // first chance for corrupt chunk - handling magic fails
+ DataBlob::from_raw(data.clone())
+ .map(|blob| (blob, Some(chunk_digest)))
+ .or_else(|err| {
+ if ignore_corrupt_chunks {
+ create_zero_chunk(format!("is corrupt - {err}"))
+ } else {
+ bail!("{err}");
+ }
+ })?
+ }
+ Err(err) => {
+ if ignore_missing_chunks && err.kind() == std::io::ErrorKind::NotFound {
+ create_zero_chunk(format!("is missing"))?
+ } else {
+ bail!("could not open chunk file - {}", err);
+ }
+ }
+ };
+
+ // second chance - we need CRC to detect truncated chunks!
+ let crc_res = if skip_crc {
+ Ok(())
+ } else {
+ chunk_blob.verify_crc()
+ };
+
+ let (chunk_blob, chunk_digest) = if let Err(crc_err) = crc_res {
+ if ignore_corrupt_chunks {
+ create_zero_chunk(format!("is corrupt - {crc_err}"))?
+ } else {
+ bail!("Error at chunk {:?} - {crc_err}", chunk_path);
+ }
+ } else {
+ (chunk_blob, chunk_digest)
+ };
+
+ // third chance - decoding might fail (digest, compression, encryption)
+ let decoded = chunk_blob
+ .decode(crypt_conf_opt.as_ref(), chunk_digest)
+ .or_else(|err| {
+ if ignore_corrupt_chunks {
+ create_zero_chunk(format!("fails to decode - {err}"))?
+ .0
+ .decode(crypt_conf_opt.as_ref(), None)
+ } else {
+ bail!("Failed to decode chunk {:?} = {}", chunk_path, err);
+ }
+ })?;
- output_file.write_all(
- chunk_blob
- .decode(crypt_conf_opt.as_ref(), Some(chunk_digest))?
- .as_slice(),
- )?;
+ output_file.write_all(decoded.as_slice())?;
}
Ok(())
--
2.30.2
next reply other threads:[~2022-05-23 14:12 UTC|newest]
Thread overview: 5+ messages / expand[flat|nested] mbox.gz Atom feed top
2022-05-23 14:11 Fabian Grünbichler [this message]
2022-05-23 14:11 ` [pbs-devel] [PATCH proxmox-backup 2/3] debug: move outfile_or_stdout to module for reuse Fabian Grünbichler
2022-05-23 14:11 ` [pbs-devel] [PATCH proxmox-backup 3/3] debug: recover: allow overriding output-path Fabian Grünbichler
2022-05-24 9:16 ` [pbs-devel] [PATCH proxmox-backup 1/3] debug: recover: allow ignoring missing/corrupt chunks Hannes Laimer
2022-05-24 9:47 ` [pbs-devel] applied-series: " Thomas Lamprecht
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20220523141135.921321-1-f.gruenbichler@proxmox.com \
--to=f.gruenbichler@proxmox.com \
--cc=pbs-devel@lists.proxmox.com \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is an external index of several public inboxes,
see mirroring instructions on how to clone and mirror
all data and code used by this external index.