src/backup/archive_index.rs: first try

This commit is contained in:
Dietmar Maurer 2018-12-31 17:30:08 +01:00
parent cbdd8c54ae
commit 0433db1949
6 changed files with 152 additions and 30 deletions

View File

@ -3,4 +3,5 @@
pub mod chunker; pub mod chunker;
pub mod chunk_store; pub mod chunk_store;
pub mod image_index; pub mod image_index;
pub mod archive_index;
pub mod datastore; pub mod datastore;

133
src/backup/archive_index.rs Normal file
View File

@ -0,0 +1,133 @@
use failure::*;
use super::chunk_store::*;
use super::chunker::*;
use std::io::{Read, Write};
use std::fs::File;
use std::path::{Path, PathBuf};
use std::os::unix::io::AsRawFd;
use uuid::Uuid;
use chrono::{Local, TimeZone};
/// On-disk header stored at the start of an archive index file.
///
/// `#[repr(C)]` keeps the fields in declaration order. The field sizes add up
/// to 12 + 4 + 16 + 8 + 4056 = 4096 bytes, and `ArchiveIndexWriter::create`
/// panics if `size_of::<ArchiveIndexHeader>()` is not 4096.
#[repr(C)]
pub struct ArchiveIndexHeader {
/// File magic; the writer sets this to `b"PROXMOX-AIDX"`.
pub magic: [u8; 12],
/// Format version, stored little-endian; the writer sets this to 1.
pub version: u32,
/// Raw bytes of the UUID generated (`Uuid::new_v4`) when the index is created.
pub uuid: [u8; 16],
/// Creation time in seconds since the UNIX epoch, stored little-endian.
pub ctime: u64,
reserved: [u8; 4056], // overall size is one page (4096 bytes)
}
/// Writer that cuts an incoming byte stream into chunks and inserts each
/// completed chunk into a `ChunkStore`.
///
/// Data is fed in through the `std::io::Write` implementation; the instance
/// is built with `ArchiveIndexWriter::create`, which also writes the header
/// to the temporary index file.
pub struct ArchiveIndexWriter<'a> {
/// Chunk store that receives every completed chunk (`insert_chunk`).
store: &'a ChunkStore,
/// Scanner used to find chunk boundaries in the written data.
chunker: Chunker,
/// Handle of the temporary index file opened by `create`.
file: File,
/// Path returned by `store.relative_path(path)` in `create`.
filename: PathBuf,
/// `filename` with its extension replaced by `tmp_aidx`; this is the file
/// that is actually opened.
tmp_filename: PathBuf,
/// Raw bytes of the UUID that was written into the header.
uuid: [u8; 16],
/// Creation time (seconds since the UNIX epoch) that was written into the header.
ctime: u64,
/// Total number of bytes accepted by `write` so far.
chunk_offset: usize,
/// Value of `chunk_offset` at the end of the most recently completed chunk.
last_chunk: usize,
/// Bytes of the chunk currently being assembled; emptied after each
/// `insert_chunk` attempt.
chunk_buffer: Vec<u8>,
}
impl<'a> ArchiveIndexWriter<'a> {
    /// Opens a new archive index for writing.
    ///
    /// The target path is obtained from `store.relative_path(path)`. The data
    /// is written to a sibling file whose extension is replaced by
    /// `tmp_aidx`; that file is created (or truncated) and initialised with a
    /// 4096 byte `ArchiveIndexHeader` carrying the magic `PROXMOX-AIDX`,
    /// version 1, the current time and a freshly generated v4 UUID.
    ///
    /// `chunk_size` is passed to `Chunker::new`, and the chunk buffer is
    /// pre-allocated with four times that capacity.
    ///
    /// # Errors
    ///
    /// Fails if the temporary file cannot be opened or written, if the system
    /// time lies before the UNIX epoch, or if `map_struct_mut` rejects the
    /// header buffer.
    ///
    /// # Panics
    ///
    /// Panics if `ArchiveIndexHeader` is not exactly 4096 bytes large.
    pub fn create(store: &'a ChunkStore, path: &Path, chunk_size: usize) -> Result<Self, Error> {
        let filename = store.relative_path(path);
        let tmp_filename = filename.with_extension("tmp_aidx");

        let mut file = std::fs::OpenOptions::new()
            .create(true)
            .truncate(true)
            .read(true)
            .write(true)
            .open(&tmp_filename)?;

        // todo: use static assertion when available in rust
        let header_size = std::mem::size_of::<ArchiveIndexHeader>();
        assert!(header_size == 4096, "got unexpected header size");

        let now = std::time::SystemTime::now();
        let ctime = now
            .duration_since(std::time::SystemTime::UNIX_EPOCH)?
            .as_secs();

        let uuid = *Uuid::new_v4().as_bytes();

        // Build the header inside a zeroed page so the reserved area stays zero.
        let mut buffer = vec![0u8; header_size];
        {
            let header = crate::tools::map_struct_mut::<ArchiveIndexHeader>(&mut buffer)?;
            header.magic = *b"PROXMOX-AIDX";
            header.version = 1u32.to_le();
            header.ctime = ctime.to_le();
            header.uuid = uuid;
        }
        file.write_all(&buffer)?;

        Ok(Self {
            store,
            chunker: Chunker::new(chunk_size),
            file,
            filename,
            tmp_filename,
            ctime,
            uuid,
            chunk_offset: 0,
            last_chunk: 0,
            chunk_buffer: Vec::with_capacity(chunk_size * 4),
        })
    }
}
impl<'a> Write for ArchiveIndexWriter<'a> {
    /// Feeds `data` to the chunker and stores a chunk once a boundary is hit.
    ///
    /// A non-zero result from `Chunker::scan` is taken as the number of
    /// leading bytes of `data` that complete the current chunk: those bytes
    /// are appended to the buffer, the buffer is inserted into the chunk
    /// store, and only that many bytes are reported as written. Otherwise all
    /// of `data` is buffered and reported as written.
    ///
    /// # Errors
    ///
    /// A failure of `insert_chunk` is returned as an `ErrorKind::Other` I/O
    /// error carrying the original error's message; the buffered chunk is
    /// discarded in that case.
    ///
    /// # Panics
    ///
    /// Panics if the buffered length disagrees with the tracked offsets.
    fn write(&mut self, data: &[u8]) -> std::result::Result<usize, std::io::Error> {
        use std::io::{Error, ErrorKind};

        let boundary = self.chunker.scan(data);

        // No boundary reported: keep collecting bytes for the current chunk.
        if boundary == 0 {
            self.chunk_offset += data.len();
            self.chunk_buffer.extend_from_slice(data);
            return Ok(data.len());
        }

        self.chunk_buffer.extend_from_slice(&data[..boundary]);
        self.chunk_offset += boundary;

        // Sanity check: the buffer must hold exactly the bytes since the last chunk.
        let chunk_size = self.chunk_buffer.len();
        let expected_chunk_size = self.chunk_offset - self.last_chunk;
        if expected_chunk_size != chunk_size {
            panic!("wrong chunk size {} != {}",
                   expected_chunk_size, chunk_size);
        }

        self.last_chunk = self.chunk_offset;

        match self.store.insert_chunk(&self.chunk_buffer) {
            Ok((is_duplicate, digest)) => {
                println!("ADD CHUNK {} {} {} {}", self.chunk_offset, chunk_size, is_duplicate, digest_to_hex(&digest));
                self.chunk_buffer.clear();
                Ok(boundary)
            }
            Err(err) => {
                self.chunk_buffer.clear();
                Err(Error::new(ErrorKind::Other, err.to_string()))
            }
        }
    }

    /// Does nothing and always succeeds.
    ///
    /// NOTE(review): bytes still sitting in `chunk_buffer` are not stored
    /// here; confirm where the trailing partial chunk is meant to be written.
    fn flush(&mut self) -> std::result::Result<(), std::io::Error> {
        Ok(())
    }
}

View File

@ -205,26 +205,3 @@ impl Chunker {
self.h ^= BUZHASH_TABLE[(byte as usize)]; self.h ^= BUZHASH_TABLE[(byte as usize)];
} }
} }
impl Write for Chunker {
    /// Scans `data` for a chunk boundary and tracks the stream offset.
    ///
    /// When `scan` returns a non-zero position, only that many bytes are
    /// consumed and the boundary is printed to stdout; otherwise all of
    /// `data` is consumed.
    fn write(&mut self, data: &[u8]) -> std::result::Result<usize, std::io::Error> {
        let boundary = self.scan(data);

        // No boundary in this buffer: account for all of it and move on.
        if boundary == 0 {
            self.offset += data.len();
            return Ok(data.len());
        }

        self.offset += boundary;
        println!("BOUND {} size {}", self.offset, self.offset - self.last_offset);
        self.last_offset = self.offset;
        Ok(boundary)
    }

    /// Does nothing and always succeeds.
    fn flush(&mut self) -> std::result::Result<(), std::io::Error> {
        Ok(())
    }
}

View File

@ -8,6 +8,7 @@ use std::sync::{Mutex, Arc};
use crate::config::datastore; use crate::config::datastore;
use super::chunk_store::*; use super::chunk_store::*;
use super::image_index::*; use super::image_index::*;
use super::archive_index::*;
pub struct DataStore { pub struct DataStore {
chunk_store: ChunkStore, chunk_store: ChunkStore,
@ -76,6 +77,16 @@ impl DataStore {
Ok(index) Ok(index)
} }
/// Creates an `ArchiveIndexWriter` for `filename` that stores its chunks in
/// this datastore's chunk store.
///
/// `chunk_size` is forwarded unchanged to `ArchiveIndexWriter::create`, and
/// any error from that call is returned to the caller.
pub fn create_archive_writer<P: AsRef<Path>>(
    &self,
    filename: P,
    chunk_size: usize,
) -> Result<ArchiveIndexWriter, Error> {
    let target = filename.as_ref();
    let writer = ArchiveIndexWriter::create(&self.chunk_store, target, chunk_size)?;
    Ok(writer)
}
pub fn list_images(&self) -> Result<Vec<PathBuf>, Error> { pub fn list_images(&self) -> Result<Vec<PathBuf>, Error> {
let base = self.chunk_store.base_path(); let base = self.chunk_store.base_path();

View File

@ -44,11 +44,11 @@ fn backup_dir(
// .truncate(true) // .truncate(true)
// .open("mytest.catar")?; // .open("mytest.catar")?;
let writer = Chunker::new(chunk_size); let mut index = datastore.create_archive_writer(&target, chunk_size)?;
let path = std::path::PathBuf::from(path); let path = std::path::PathBuf::from(path);
CaTarEncoder::encode(path, dir, writer)?; CaTarEncoder::encode(path, dir, index)?;
Ok(()) Ok(())
} }

View File

@ -163,7 +163,7 @@ impl <W: Write> CaTarEncoder<W> {
fn encode_dir(&mut self, dir: &mut nix::dir::Dir) -> Result<(), Error> { fn encode_dir(&mut self, dir: &mut nix::dir::Dir) -> Result<(), Error> {
println!("encode_dir: {:?} start {}", self.current_path, self.writer_pos); //println!("encode_dir: {:?} start {}", self.current_path, self.writer_pos);
let mut name_list = vec![]; let mut name_list = vec![];
@ -270,7 +270,7 @@ impl <W: Write> CaTarEncoder<W> {
self.current_path.pop(); self.current_path.pop();
} }
println!("encode_dir: {:?} end {}", self.current_path, self.writer_pos); //println!("encode_dir: {:?} end {}", self.current_path, self.writer_pos);
// fixup goodby item offsets // fixup goodby item offsets
let goodbye_start = self.writer_pos as u64; let goodbye_start = self.writer_pos as u64;
@ -282,13 +282,13 @@ impl <W: Write> CaTarEncoder<W> {
self.write_goodbye_table(goodbye_offset, &mut goodbye_items)?; self.write_goodbye_table(goodbye_offset, &mut goodbye_items)?;
println!("encode_dir: {:?} end1 {}", self.current_path, self.writer_pos); //println!("encode_dir: {:?} end1 {}", self.current_path, self.writer_pos);
Ok(()) Ok(())
} }
fn encode_file(&mut self, filefd: RawFd) -> Result<(), Error> { fn encode_file(&mut self, filefd: RawFd) -> Result<(), Error> {
println!("encode_file: {:?}", self.current_path); //println!("encode_file: {:?}", self.current_path);
let stat = match nix::sys::stat::fstat(filefd) { let stat = match nix::sys::stat::fstat(filefd) {
Ok(stat) => stat, Ok(stat) => stat,
@ -338,7 +338,7 @@ impl <W: Write> CaTarEncoder<W> {
fn encode_symlink(&mut self, target: &[u8], stat: &FileStat) -> Result<(), Error> { fn encode_symlink(&mut self, target: &[u8], stat: &FileStat) -> Result<(), Error> {
println!("encode_symlink: {:?} -> {:?}", self.current_path, target); //println!("encode_symlink: {:?} -> {:?}", self.current_path, target);
self.write_entry(stat)?; self.write_entry(stat)?;