src/backup/data_chunk.rs: Data Chunk builder
Make handling encoded chunks easier.
This commit is contained in:
parent
a70b2aeb48
commit
b595cb9d2c
@ -124,6 +124,9 @@ pub static ENCR_COMPR_CHUNK_MAGIC_1_0: [u8; 8] = [9, 40, 53, 200, 37, 150, 90, 1
|
||||
mod crypt_setup;
|
||||
pub use crypt_setup::*;
|
||||
|
||||
mod data_chunk;
|
||||
pub use data_chunk::*;
|
||||
|
||||
mod chunk_stream;
|
||||
pub use chunk_stream::*;
|
||||
|
||||
|
226
src/backup/data_chunk.rs
Normal file
226
src/backup/data_chunk.rs
Normal file
@ -0,0 +1,226 @@
|
||||
use failure::*;
|
||||
use std::convert::TryInto;
|
||||
use std::io::Write;
|
||||
|
||||
use super::*;
|
||||
|
||||
|
||||
/// Data chunk binary storage format
///
/// Data chunks are identified by a unique digest, and can be
/// compressed and encrypted. A simple binary format is used to store
/// them on disk or transfer them over the network.
///
/// The format starts with an 8 byte magic number to identify the type.
/// Encrypted chunks contain a 16 byte IV, followed by a 16 byte
/// authentication tag (MAC), followed by the encrypted data
/// (MAGIC || IV || TAG || EncryptedData), i.e. they are at least
/// 40 bytes long.
///
/// Unencrypted chunks simply contain the (compressed) data after the
/// magic number (MAGIC || Data).
///
/// Please use the ``DataChunkBuilder`` to create new instances.
pub struct DataChunk {
    /// Digest identifying this chunk.
    digest: [u8; 32],
    /// Encoded chunk: the magic number followed by the (optionally
    /// compressed and/or encrypted) payload.
    raw_data: Vec<u8>,
}
|
||||
|
||||
impl DataChunk {
|
||||
|
||||
/// accessor to raw_data field
|
||||
pub fn raw_data(&self) -> &[u8] {
|
||||
&self.raw_data
|
||||
}
|
||||
|
||||
/// accessor to chunk digest field
|
||||
pub fn digest(&self) -> &[u8; 32] {
|
||||
&self.digest
|
||||
}
|
||||
|
||||
/// accessor to chunk type (magic number)
|
||||
pub fn magic(&self) -> &[u8; 8] {
|
||||
self.raw_data[0..8].try_into().unwrap()
|
||||
}
|
||||
|
||||
// only valid for enrypted data
|
||||
//pub fn iv(&self) -> &[u8; 16] {
|
||||
// self.raw_data[8..24].try_into().unwrap()
|
||||
//}
|
||||
|
||||
// only valid for enrypted data
|
||||
//pub fn mac(&self) -> &[u8; 16] {
|
||||
// self.raw_data[24..40].try_into().unwrap()
|
||||
//}
|
||||
|
||||
fn new(
|
||||
data: &[u8],
|
||||
config: Option<&CryptConfig>,
|
||||
digest: [u8;32],
|
||||
compress: bool,
|
||||
) -> Result<Self, Error> {
|
||||
|
||||
if let Some(config) = config {
|
||||
|
||||
let enc_data = config.encode_chunk(data, compress)?;
|
||||
let chunk = DataChunk { digest, raw_data: enc_data };
|
||||
|
||||
Ok(chunk)
|
||||
} else {
|
||||
|
||||
if compress {
|
||||
let mut comp_data = Vec::with_capacity(data.len() + 8);
|
||||
|
||||
comp_data.write_all(&COMPRESSED_CHUNK_MAGIC_1_0)?;
|
||||
zstd::stream::copy_encode(data, &mut comp_data, 1)?;
|
||||
|
||||
let chunk = DataChunk { digest, raw_data: comp_data };
|
||||
|
||||
return Ok(chunk);
|
||||
} else {
|
||||
// TODO: howto avoid data copy here?
|
||||
let mut raw_data = Vec::with_capacity(data.len() + 8);
|
||||
|
||||
raw_data.write_all(&UNCOMPRESSED_CHUNK_MAGIC_1_0)?;
|
||||
raw_data.extend_from_slice(data);
|
||||
|
||||
let chunk = DataChunk { digest, raw_data };
|
||||
return Ok(chunk);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
/// Decode chunk data
|
||||
pub fn decode(self, config: &CryptConfig) -> Result<Vec<u8>, Error> {
|
||||
|
||||
let magic = self.magic();
|
||||
|
||||
if magic == &UNCOMPRESSED_CHUNK_MAGIC_1_0 {
|
||||
return Ok(self.raw_data);
|
||||
} else if magic == &COMPRESSED_CHUNK_MAGIC_1_0 {
|
||||
|
||||
let data = zstd::block::decompress(&self.raw_data[8..], 16*1024*1024)?;
|
||||
return Ok(data);
|
||||
|
||||
} else if magic == &ENCR_COMPR_CHUNK_MAGIC_1_0 || magic == &ENCRYPTED_CHUNK_MAGIC_1_0 {
|
||||
|
||||
let data = config.decode_chunk(&self.raw_data)?;
|
||||
|
||||
return Ok(data);
|
||||
} else {
|
||||
bail!("Invalid chunk magic number.");
|
||||
}
|
||||
}
|
||||
|
||||
/// Load chunk data from ``reader``
|
||||
///
|
||||
/// Please note that it is impossible to compute the digest for
|
||||
/// encrypted chunks, so we need to trust and use the provided
|
||||
/// ``digest``.
|
||||
pub fn load(reader: &mut dyn std::io::Read, digest: [u8; 32]) -> Result<Self, Error> {
|
||||
|
||||
let mut data = Vec::with_capacity(1024*1024);
|
||||
reader.read_to_end(&mut data)?;
|
||||
|
||||
if data.len() < 8 {
|
||||
bail!("chunk too small ({} bytes).", data.len());
|
||||
}
|
||||
|
||||
let magic = &data[0..8];
|
||||
|
||||
if magic == ENCR_COMPR_CHUNK_MAGIC_1_0 || magic == ENCRYPTED_CHUNK_MAGIC_1_0 {
|
||||
|
||||
if data.len() < 40 {
|
||||
bail!("encrypted chunk too small ({} bytes).", data.len());
|
||||
}
|
||||
|
||||
let chunk = DataChunk { digest: digest, raw_data: data };
|
||||
|
||||
Ok(chunk)
|
||||
} else if magic == COMPRESSED_CHUNK_MAGIC_1_0 || magic == UNCOMPRESSED_CHUNK_MAGIC_1_0 {
|
||||
|
||||
let chunk = DataChunk { digest: digest, raw_data: data };
|
||||
|
||||
Ok(chunk)
|
||||
} else {
|
||||
bail!("unable to load chunk - wrong magic");
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
/// Builder for DataChunk
|
||||
///
|
||||
/// Main purpose is to centralize digest computation. Digest
|
||||
/// computation differ for encryped chunk, and this interface ensures that
|
||||
/// we always compute the correct one.
|
||||
pub struct DataChunkBuilder<'a, 'b> {
|
||||
config: Option<&'b CryptConfig>,
|
||||
orig_data: &'a [u8],
|
||||
digest_computed: bool,
|
||||
digest: [u8; 32],
|
||||
compress: bool,
|
||||
}
|
||||
|
||||
impl <'a, 'b> DataChunkBuilder<'a, 'b> {
|
||||
|
||||
/// Create a new builder instance.
|
||||
pub fn new(orig_data: &'a [u8]) -> Self {
|
||||
Self {
|
||||
orig_data,
|
||||
config: None,
|
||||
digest_computed: false,
|
||||
digest: [0u8; 32],
|
||||
compress: false,
|
||||
}
|
||||
}
|
||||
|
||||
/// Set compression flag.
|
||||
///
|
||||
/// If true, chunk data is compressed using zstd (level 1).
|
||||
pub fn compress(mut self, value: bool) -> Self {
|
||||
self.compress = value;
|
||||
self
|
||||
}
|
||||
|
||||
/// Set encryption Configuration
|
||||
///
|
||||
/// If set, chunks are encrypted.
|
||||
pub fn crypt_config(mut self, value: &'b CryptConfig) -> Self {
|
||||
if self.digest_computed {
|
||||
panic!("unable to set crypt_config after compute_digest().");
|
||||
}
|
||||
self.config = Some(value);
|
||||
self
|
||||
}
|
||||
|
||||
fn compute_digest(&mut self) {
|
||||
if !self.digest_computed {
|
||||
if let Some(config) = self.config {
|
||||
self.digest = config.compute_digest(self.orig_data);
|
||||
} else {
|
||||
self.digest = openssl::sha::sha256(self.orig_data);
|
||||
}
|
||||
self.digest_computed = true;
|
||||
}
|
||||
}
|
||||
|
||||
/// Returns the chunk Digest
|
||||
///
|
||||
/// Note: For encrypted chunks, this needs to be called after
|
||||
/// ``crypt_config``.
|
||||
pub fn digest(&mut self) -> &[u8; 32] {
|
||||
if !self.digest_computed {
|
||||
self.compute_digest();
|
||||
}
|
||||
&self.digest
|
||||
}
|
||||
|
||||
/// Consume self and build the ``DataChunk``.
|
||||
pub fn build(mut self) -> Result<DataChunk, Error> {
|
||||
if !self.digest_computed {
|
||||
self.compute_digest();
|
||||
}
|
||||
|
||||
let chunk = DataChunk::new(self.orig_data, self.config, self.digest, self.compress)?;
|
||||
|
||||
Ok(chunk)
|
||||
}
|
||||
}
|
Loading…
Reference in New Issue
Block a user