From: Dominik Csapak <d.csapak@proxmox.com>
To: pbs-devel@lists.proxmox.com
Subject: [pbs-devel] [PATCH proxmox-backup 1/3] tape: media_catalog: add fast_catalog beside normal catalog
Date: Mon, 19 Jul 2021 16:55:54 +0200 [thread overview]
Message-ID: <20210719145556.2781356-1-d.csapak@proxmox.com> (raw)
for some parts of the ui, we only need the snapshot list from the catalog,
and reading the whole catalog (can be multiple hundred MiB) is not
really necessary.
Instead, on every commit of the catalog, write the complete content list
into a seperate .index file, that can be read to get only the snapshot
list.
Signed-off-by: Dominik Csapak <d.csapak@proxmox.com>
---
src/tape/media_catalog.rs | 108 +++++++++++++++++++++++++++++++++++++-
1 file changed, 106 insertions(+), 2 deletions(-)
diff --git a/src/tape/media_catalog.rs b/src/tape/media_catalog.rs
index 65b52a42..6a9c8ce1 100644
--- a/src/tape/media_catalog.rs
+++ b/src/tape/media_catalog.rs
@@ -1,8 +1,8 @@
use std::convert::TryFrom;
use std::fs::File;
-use std::io::{Write, Read, BufReader, Seek, SeekFrom};
+use std::io::{Write, Read, BufRead, BufReader, Seek, SeekFrom};
use std::os::unix::io::AsRawFd;
-use std::path::Path;
+use std::path::{Path, PathBuf};
use std::collections::{HashSet, HashMap};
use anyhow::{bail, format_err, Error};
@@ -53,6 +53,7 @@ impl DatastoreContent {
///
/// We use a simple binary format to store data on disk.
pub struct MediaCatalog {
+ base_path: PathBuf,
uuid: Uuid, // BackupMedia uuid
@@ -108,7 +109,11 @@ impl MediaCatalog {
let mut path = base_path.to_owned();
path.push(uuid.to_string());
+ let mut fast_catalog = path.clone();
path.set_extension("log");
+ fast_catalog.set_extension("index");
+
+ let _ = std::fs::remove_file(fast_catalog); // ignore errors
match std::fs::remove_file(path) {
Ok(()) => Ok(()),
@@ -217,6 +222,7 @@ impl MediaCatalog {
.map_err(|err| format_err!("fchown failed - {}", err))?;
let mut me = Self {
+ base_path: base_path.to_path_buf(),
uuid: uuid.clone(),
file: None,
log_to_stdout: false,
@@ -294,6 +300,7 @@ impl MediaCatalog {
let file = Self::create_temporary_database_file(base_path, uuid)?;
let mut me = Self {
+ base_path: base_path.to_path_buf(),
uuid: uuid.clone(),
file: Some(file),
log_to_stdout: false,
@@ -360,6 +367,99 @@ impl MediaCatalog {
&self.content
}
+ fn load_fast_catalog(
+ file: &mut File,
+ ) -> Result<Vec<(String, String)>, Error> {
+ let mut list = Vec::new();
+ let file = BufReader::new(file);
+ for line in file.lines() {
+ let mut line = line?;
+
+ let idx = line
+ .find(':')
+ .ok_or_else(|| format_err!("invalid line format (no store found)"))?;
+
+ let snapshot = line.split_off(idx + 1);
+ line.truncate(idx);
+ list.push((line, snapshot));
+ }
+
+ Ok(list)
+ }
+
+ /// Returns a list of (store, snapshot) for a given MediaId
+ pub fn snapshot_list(
+ base_path: &Path,
+ media_id: &MediaId,
+ ) -> Result<Vec<(String, String)>, Error> {
+ let uuid = &media_id.label.uuid;
+
+ let mut path = base_path.to_owned();
+ path.push(uuid.to_string());
+ path.set_extension("index");
+
+
+ let list = proxmox::try_block!({
+
+ Self::create_basedir(base_path)?;
+
+ let mut file = match std::fs::OpenOptions::new().read(true).open(&path) {
+ Ok(file) => file,
+ Err(err) if err.kind() == std::io::ErrorKind::NotFound => {
+ // open normal catalog and write fast index
+ let catalog = Self::open(base_path, media_id, false, false)?;
+ catalog.write_snapshot_list()?;
+ let mut list = Vec::new();
+ for (store, content) in catalog.content() {
+ for snapshot in content.snapshot_index.keys() {
+ list.push((store.to_string(), snapshot.to_string()));
+ }
+ }
+ return Ok(list);
+ },
+ Err(err) => bail!(err),
+ };
+
+ Self::load_fast_catalog(&mut file)
+ }).map_err(|err: Error| {
+ format_err!("unable to open fast media catalog {:?} - {}", path, err)
+ })?;
+
+ Ok(list)
+ }
+
+ // writes the full snapshot list into <uuid>.index
+ fn write_snapshot_list(&self) -> Result<(), Error> {
+ let mut data = String::new();
+
+ for (store, content) in self.content() {
+ for snapshot in content.snapshot_index.keys() {
+ data.push_str(store);
+ data.push_str(":");
+ data.push_str(snapshot);
+ data.push_str("\n");
+ }
+ }
+
+ let mut path = self.base_path.clone();
+ path.push(self.uuid.to_string());
+ path.set_extension("index");
+
+ let backup_user = crate::backup::backup_user()?;
+ let options = if cfg!(test) {
+ // cannot chown the file in the test environment
+ CreateOptions::new()
+ } else {
+ CreateOptions::new().owner(backup_user.uid).group(backup_user.gid)
+ };
+
+ proxmox::tools::fs::replace_file(
+ path,
+ data.as_bytes(),
+ options,
+ )
+ }
+
/// Commit pending changes
///
/// This is necessary to store changes persistently.
@@ -380,6 +480,10 @@ impl MediaCatalog {
None => bail!("media catalog not writable (opened read only)"),
}
+ self.write_snapshot_list().map_err(|err| {
+ format_err!("could not write fast catalog: {}", err)
+ })?;
+
self.pending = Vec::new();
Ok(())
--
2.30.2
next reply other threads:[~2021-07-19 14:56 UTC|newest]
Thread overview: 5+ messages / expand[flat|nested] mbox.gz Atom feed top
2021-07-19 14:55 Dominik Csapak [this message]
2021-07-19 14:55 ` [pbs-devel] [RFC PATCH proxmox-backup 2/3] tape: media_catalog: add local type aliases to make code more clear Dominik Csapak
2021-07-19 14:55 ` [pbs-devel] [PATCH proxmox-backup 3/3] api2: tape: media: use MediaCatalog::snapshot_list for content listing Dominik Csapak
2021-07-20 6:15 [pbs-devel] [PATCH proxmox-backup 1/3] tape: media_catalog: add fast_catalog beside normal catalog Dietmar Maurer
2021-07-20 7:01 ` Dominik Csapak
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20210719145556.2781356-1-d.csapak@proxmox.com \
--to=d.csapak@proxmox.com \
--cc=pbs-devel@lists.proxmox.com \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
Be sure your reply has a Subject: header at the top and a blank line
before the message body.
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox