2018-12-30 16:43:53 +00:00
|
|
|
//! *catar* format decoder.
//!
//! This module contains the code to decode *catar* archive files.
|
2018-12-30 16:32:52 +00:00
|
|
|
|
2019-01-06 16:27:57 +00:00
|
|
|
use failure::*;
|
2019-01-07 18:07:03 +00:00
|
|
|
use endian_trait::Endian;
|
2018-12-30 16:32:52 +00:00
|
|
|
|
2019-01-06 16:27:57 +00:00
|
|
|
use super::format_definition::*;
|
|
|
|
use crate::tools;
|
|
|
|
|
|
|
|
use std::io::{Read, Seek, SeekFrom};
|
2019-01-07 18:07:03 +00:00
|
|
|
use std::path::{Path, PathBuf};
|
2019-01-06 16:27:57 +00:00
|
|
|
|
|
|
|
use std::os::unix::ffi::{OsStrExt, OsStringExt};
|
|
|
|
use std::ffi::{OsStr, OsString};
|
|
|
|
|
|
|
|
pub struct CaDirectoryEntry {
|
|
|
|
start: u64,
|
|
|
|
end: u64,
|
|
|
|
pub filename: OsString,
|
|
|
|
pub entry: CaFormatEntry,
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Decoder for *catar* archives that are accessible through a seekable reader.
///
/// Seeking is required because directory listings are located through the
/// goodbye table stored at the end of each directory object.
// This one needs Read+Seek (we may want one without Seek?)
pub struct CaTarDecoder<'a, R>
where
    R: Read + Seek,
{
    /// Borrowed archive stream; every method repositions it as needed.
    reader: &'a mut R,
    /// Offset of the first byte of the root object.
    root_start: u64,
    /// Offset just past the root object.
    root_end: u64,
}
|
|
|
|
|
|
|
|
/// Size in bytes of a `CaFormatHeader`, the header that is read in front of
/// each archive item. Item sizes stored in the archive include this header.
const HEADER_SIZE: u64 = std::mem::size_of::<CaFormatHeader>() as u64;
|
|
|
|
|
|
|
|
impl <'a, R: Read + Seek> CaTarDecoder<'a, R> {
|
|
|
|
|
|
|
|
pub fn new(reader: &'a mut R) -> Result<Self, Error> {
|
|
|
|
|
|
|
|
let root_end = reader.seek(SeekFrom::End(0))?;
|
|
|
|
|
|
|
|
Ok(Self {
|
|
|
|
reader: reader,
|
|
|
|
root_start: 0,
|
|
|
|
root_end: root_end,
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn root(&self) -> CaDirectoryEntry {
|
|
|
|
CaDirectoryEntry {
|
|
|
|
start: self.root_start,
|
|
|
|
end: self.root_end,
|
|
|
|
filename: OsString::new(), // Empty
|
|
|
|
entry: CaFormatEntry {
|
|
|
|
feature_flags: 0,
|
|
|
|
mode: 0,
|
|
|
|
flags: 0,
|
|
|
|
uid: 0,
|
|
|
|
gid: 0,
|
|
|
|
mtime: 0,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-01-07 18:07:03 +00:00
|
|
|
fn read_item<T: Endian>(&mut self) -> Result<T, Error> {
|
2019-01-06 16:27:57 +00:00
|
|
|
|
2019-01-07 18:07:03 +00:00
|
|
|
let mut result: T = unsafe { std::mem::uninitialized() };
|
2019-01-06 16:27:57 +00:00
|
|
|
|
2019-01-07 18:07:03 +00:00
|
|
|
let buffer = unsafe { std::slice::from_raw_parts_mut(
|
|
|
|
&mut result as *mut T as *mut u8,
|
|
|
|
std::mem::size_of::<T>()
|
|
|
|
)};
|
|
|
|
|
|
|
|
self.reader.read_exact(buffer)?;
|
|
|
|
|
|
|
|
Ok(result.from_le())
|
|
|
|
}
|
|
|
|
|
|
|
|
fn read_symlink(&mut self, size: u64) -> Result<PathBuf, Error> {
|
|
|
|
if size < (HEADER_SIZE + 2) {
|
|
|
|
bail!("dectected short symlink target.");
|
2019-01-06 16:27:57 +00:00
|
|
|
}
|
2019-01-07 18:07:03 +00:00
|
|
|
let target_len = size - HEADER_SIZE;
|
2019-01-06 16:27:57 +00:00
|
|
|
|
2019-01-07 18:07:03 +00:00
|
|
|
if target_len > (libc::PATH_MAX as u64) {
|
|
|
|
bail!("symlink target too long ({}).", target_len);
|
|
|
|
}
|
2019-01-06 16:27:57 +00:00
|
|
|
|
2019-01-07 18:07:03 +00:00
|
|
|
let mut buffer = vec![0u8; target_len as usize];
|
|
|
|
self.reader.read_exact(&mut buffer)?;
|
2019-01-06 16:27:57 +00:00
|
|
|
|
2019-01-07 18:07:03 +00:00
|
|
|
let last_byte = buffer.pop().unwrap();
|
|
|
|
if last_byte != 0u8 {
|
|
|
|
bail!("symlink target not nul terminated.");
|
2019-01-06 16:27:57 +00:00
|
|
|
}
|
2019-01-07 18:07:03 +00:00
|
|
|
|
|
|
|
Ok(PathBuf::from(std::ffi::OsString::from_vec(buffer)))
|
|
|
|
}
|
|
|
|
|
|
|
|
fn read_filename(&mut self, size: u64) -> Result<OsString, Error> {
|
|
|
|
if size < (HEADER_SIZE + 2) {
|
|
|
|
bail!("dectected short filename");
|
|
|
|
}
|
|
|
|
let name_len = size - HEADER_SIZE;
|
2019-01-06 16:27:57 +00:00
|
|
|
|
|
|
|
if name_len > ((libc::FILENAME_MAX as u64) + 1) {
|
2019-01-07 18:07:03 +00:00
|
|
|
bail!("filename too long ({}).", name_len);
|
2019-01-06 16:27:57 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
let mut buffer = vec![0u8; name_len as usize];
|
|
|
|
self.reader.read_exact(&mut buffer)?;
|
|
|
|
|
|
|
|
let last_byte = buffer.pop().unwrap();
|
|
|
|
if last_byte != 0u8 {
|
2019-01-07 18:07:03 +00:00
|
|
|
bail!("filename entry not nul terminated.");
|
|
|
|
}
|
2019-01-06 16:27:57 +00:00
|
|
|
|
2019-01-07 18:07:03 +00:00
|
|
|
Ok(std::ffi::OsString::from_vec(buffer))
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn restore<F: Fn(&Path) -> Result<(), Error>>(
|
|
|
|
&mut self,
|
|
|
|
dir: &CaDirectoryEntry,
|
|
|
|
callback: F,
|
|
|
|
) -> Result<(), Error> {
|
|
|
|
|
|
|
|
let start = dir.start;
|
|
|
|
let end = dir.end;
|
|
|
|
|
|
|
|
self.reader.seek(SeekFrom::Start(start))?;
|
|
|
|
|
|
|
|
let mut path = PathBuf::from(".");
|
|
|
|
|
|
|
|
self.restore_sequential(&mut path, &callback)
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn restore_sequential<F: Fn(&Path) -> Result<(), Error>>(
|
|
|
|
&mut self,
|
|
|
|
path: &mut PathBuf,
|
|
|
|
callback: &F,
|
|
|
|
) -> Result<(), Error> {
|
|
|
|
|
|
|
|
// read ENTRY first
|
|
|
|
let head: CaFormatHeader = self.read_item()?;
|
|
|
|
check_ca_header::<CaFormatEntry>(&head, CA_FORMAT_ENTRY)?;
|
|
|
|
let entry: CaFormatEntry = self.read_item()?;
|
|
|
|
|
2019-01-07 18:18:59 +00:00
|
|
|
let mode = entry.mode as u32; //fixme: upper 32bits?
|
|
|
|
|
|
|
|
let is_dir = (mode & libc::S_IFMT) == libc::S_IFDIR;
|
2019-01-07 18:07:03 +00:00
|
|
|
|
|
|
|
loop {
|
|
|
|
let head: CaFormatHeader = self.read_item()?;
|
|
|
|
match head.htype {
|
|
|
|
CA_FORMAT_SYMLINK => {
|
2019-01-07 18:18:59 +00:00
|
|
|
if ((mode & libc::S_IFMT) != libc::S_IFLNK) {
|
|
|
|
bail!("detected unexpected symlink item.");
|
|
|
|
}
|
2019-01-07 18:07:03 +00:00
|
|
|
let target = self.read_symlink(head.size)?;
|
|
|
|
println!("TARGET: {:?}", target);
|
2019-01-07 18:18:59 +00:00
|
|
|
return Ok(());
|
2019-01-07 18:07:03 +00:00
|
|
|
}
|
|
|
|
CA_FORMAT_FILENAME => {
|
2019-01-07 18:18:59 +00:00
|
|
|
if !is_dir {
|
|
|
|
bail!("onyl directoriy entries may contain file names.");
|
|
|
|
}
|
2019-01-07 18:07:03 +00:00
|
|
|
let name = self.read_filename(head.size)?;
|
|
|
|
path.push(name);
|
|
|
|
println!("NAME: {:?}", path);
|
|
|
|
self.restore_sequential(path, callback)?;
|
|
|
|
path.pop();
|
2019-01-07 18:18:59 +00:00
|
|
|
}
|
2019-01-07 18:07:03 +00:00
|
|
|
CA_FORMAT_PAYLOAD => {
|
2019-01-07 18:18:59 +00:00
|
|
|
if ((mode & libc::S_IFMT) != libc::S_IFREG) {
|
|
|
|
bail!("detected enexpected paylod item.");
|
|
|
|
}
|
2019-01-07 18:07:03 +00:00
|
|
|
println!("Skip Payload");
|
|
|
|
if head.size < HEADER_SIZE { bail!("detected short payload"); }
|
|
|
|
self.reader.seek(SeekFrom::Current((head.size - HEADER_SIZE) as i64))?;
|
2019-01-07 18:18:59 +00:00
|
|
|
return Ok(());
|
|
|
|
}
|
2019-01-07 18:07:03 +00:00
|
|
|
CA_FORMAT_GOODBYE => {
|
2019-01-07 18:18:59 +00:00
|
|
|
if !is_dir {
|
|
|
|
bail!("onyl directoriy entries may contain goodbye tables.");
|
|
|
|
}
|
2019-01-07 18:07:03 +00:00
|
|
|
println!("Skip Goodbye");
|
|
|
|
if head.size < HEADER_SIZE { bail!("detected short goodbye table"); }
|
|
|
|
self.reader.seek(SeekFrom::Current((head.size - HEADER_SIZE) as i64))?;
|
|
|
|
return Ok(());
|
|
|
|
}
|
|
|
|
_ => {
|
|
|
|
bail!("got unknown header type {:016x}", head.htype);
|
|
|
|
}
|
|
|
|
}
|
2019-01-06 16:27:57 +00:00
|
|
|
}
|
|
|
|
|
2019-01-07 18:07:03 +00:00
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
|
|
|
|
fn read_directory_entry(&mut self, start: u64, end: u64) -> Result<CaDirectoryEntry, Error> {
|
2019-01-06 16:27:57 +00:00
|
|
|
|
2019-01-07 18:07:03 +00:00
|
|
|
self.reader.seek(SeekFrom::Start(start))?;
|
2019-01-06 16:27:57 +00:00
|
|
|
let mut buffer = [0u8; HEADER_SIZE as usize];
|
|
|
|
self.reader.read_exact(&mut buffer)?;
|
|
|
|
let head = tools::map_struct::<CaFormatHeader>(&buffer)?;
|
|
|
|
|
2019-01-07 18:07:03 +00:00
|
|
|
if u64::from_le(head.htype) != CA_FORMAT_FILENAME {
|
|
|
|
bail!("wrong filename header type for object [{}..{}]", start, end);
|
2019-01-06 16:27:57 +00:00
|
|
|
}
|
|
|
|
|
2019-01-07 18:07:03 +00:00
|
|
|
let mut name_len = u64::from_le(head.size);
|
2019-01-06 16:27:57 +00:00
|
|
|
|
2019-01-07 18:07:03 +00:00
|
|
|
let entry_start = start + name_len;
|
2019-01-06 16:27:57 +00:00
|
|
|
|
2019-01-07 18:07:03 +00:00
|
|
|
let filename = self.read_filename(name_len)?;
|
|
|
|
|
|
|
|
let head: CaFormatHeader = self.read_item()?;
|
|
|
|
check_ca_header::<CaFormatEntry>(&head, CA_FORMAT_ENTRY)?;
|
|
|
|
let entry: CaFormatEntry = self.read_item()?;
|
2019-01-06 16:27:57 +00:00
|
|
|
|
|
|
|
Ok(CaDirectoryEntry {
|
|
|
|
start: entry_start,
|
|
|
|
end: end,
|
|
|
|
filename: filename,
|
|
|
|
entry: CaFormatEntry {
|
|
|
|
feature_flags: u64::from_le(entry.feature_flags),
|
|
|
|
mode: u64::from_le(entry.mode),
|
|
|
|
flags: u64::from_le(entry.flags),
|
|
|
|
uid: u64::from_le(entry.uid),
|
|
|
|
gid: u64::from_le(entry.gid),
|
|
|
|
mtime: u64::from_le(entry.mtime),
|
|
|
|
},
|
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn list_dir(&mut self, dir: &CaDirectoryEntry) -> Result<Vec<CaDirectoryEntry>, Error> {
|
|
|
|
|
|
|
|
const GOODBYE_ITEM_SIZE: u64 = std::mem::size_of::<CaFormatGoodbyeItem>() as u64;
|
|
|
|
|
|
|
|
let start = dir.start;
|
|
|
|
let end = dir.end;
|
|
|
|
|
|
|
|
//println!("list_dir1: {} {}", start, end);
|
|
|
|
|
|
|
|
if (end - start) < (HEADER_SIZE + GOODBYE_ITEM_SIZE) {
|
|
|
|
bail!("detected short object [{}..{}]", start, end);
|
|
|
|
}
|
|
|
|
|
|
|
|
self.reader.seek(SeekFrom::Start(end - GOODBYE_ITEM_SIZE))?;
|
|
|
|
let mut buffer = [0u8; GOODBYE_ITEM_SIZE as usize];
|
|
|
|
self.reader.read_exact(&mut buffer)?;
|
|
|
|
|
|
|
|
let item = tools::map_struct::<CaFormatGoodbyeItem>(&buffer)?;
|
|
|
|
|
|
|
|
if u64::from_le(item.hash) != CA_FORMAT_GOODBYE_TAIL_MARKER {
|
|
|
|
bail!("missing goodbye tail marker for object [{}..{}]", start, end);
|
|
|
|
}
|
|
|
|
|
|
|
|
let goodbye_table_size = u64::from_le(item.size);
|
|
|
|
if goodbye_table_size < (HEADER_SIZE + GOODBYE_ITEM_SIZE) {
|
|
|
|
bail!("short goodbye table size for object [{}..{}]", start, end);
|
|
|
|
|
|
|
|
}
|
|
|
|
let goodbye_inner_size = goodbye_table_size - HEADER_SIZE - GOODBYE_ITEM_SIZE;
|
|
|
|
if (goodbye_inner_size % GOODBYE_ITEM_SIZE) != 0 {
|
|
|
|
bail!("wrong goodbye inner table size for entry [{}..{}]", start, end);
|
|
|
|
}
|
|
|
|
|
|
|
|
let goodbye_start = end - goodbye_table_size;
|
|
|
|
|
|
|
|
if u64::from_le(item.offset) != (goodbye_start - start) {
|
|
|
|
println!("DEBUG: {} {}", u64::from_le(item.offset), goodbye_start - start);
|
|
|
|
bail!("wrong offset in goodbye tail marker for entry [{}..{}]", start, end);
|
|
|
|
}
|
|
|
|
|
|
|
|
self.reader.seek(SeekFrom::Start(goodbye_start))?;
|
|
|
|
let mut buffer = [0u8; HEADER_SIZE as usize];
|
|
|
|
self.reader.read_exact(&mut buffer)?;
|
|
|
|
let head = tools::map_struct::<CaFormatHeader>(&buffer)?;
|
|
|
|
|
|
|
|
if u64::from_le(head.htype) != CA_FORMAT_GOODBYE {
|
|
|
|
bail!("wrong goodbye table header type for entry [{}..{}]", start, end);
|
|
|
|
}
|
|
|
|
|
|
|
|
if u64::from_le(head.size) != goodbye_table_size {
|
|
|
|
bail!("wrong goodbye table size for entry [{}..{}]", start, end);
|
|
|
|
}
|
|
|
|
|
|
|
|
let mut buffer = [0u8; GOODBYE_ITEM_SIZE as usize];
|
|
|
|
|
|
|
|
let mut range_list = Vec::new();
|
|
|
|
|
|
|
|
for i in 0..goodbye_inner_size/GOODBYE_ITEM_SIZE {
|
|
|
|
self.reader.read_exact(&mut buffer)?;
|
|
|
|
let item = tools::map_struct::<CaFormatGoodbyeItem>(&buffer)?;
|
|
|
|
let item_offset = u64::from_le(item.offset);
|
|
|
|
if item_offset > (goodbye_start - start) {
|
|
|
|
bail!("goodbye entry {} offset out of range [{}..{}] {} {} {}",
|
|
|
|
i, start, end, item_offset, goodbye_start, start);
|
|
|
|
}
|
|
|
|
let item_start = goodbye_start - item_offset;
|
|
|
|
let item_hash = u64::from_le(item.hash);
|
|
|
|
let item_end = item_start + u64::from_le(item.size);
|
|
|
|
if item_end > goodbye_start {
|
|
|
|
bail!("goodbye entry {} end out of range [{}..{}]",
|
|
|
|
i, start, end);
|
|
|
|
}
|
|
|
|
|
|
|
|
range_list.push((item_start, item_end));
|
|
|
|
}
|
|
|
|
|
|
|
|
let mut result = vec![];
|
|
|
|
|
|
|
|
for (item_start, item_end) in range_list {
|
|
|
|
let entry = self.read_directory_entry(item_start, item_end)?;
|
|
|
|
//println!("ENTRY: {} {} {:?}", item_start, item_end, entry.filename);
|
|
|
|
result.push(entry);
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(result)
|
|
|
|
}
|
|
|
|
|
|
|
|
pub fn print_filenames<W: std::io::Write>(
|
|
|
|
&mut self,
|
|
|
|
output: &mut W,
|
|
|
|
prefix: &mut PathBuf,
|
|
|
|
dir: &CaDirectoryEntry,
|
|
|
|
) -> Result<(), Error> {
|
|
|
|
|
|
|
|
let mut list = self.list_dir(dir)?;
|
|
|
|
|
|
|
|
list.sort_unstable_by(|a, b| a.filename.cmp(&b.filename));
|
|
|
|
|
|
|
|
for item in &list {
|
|
|
|
|
|
|
|
prefix.push(item.filename.clone());
|
|
|
|
|
|
|
|
let mode = item.entry.mode as u32;
|
|
|
|
|
|
|
|
let osstr: &OsStr = prefix.as_ref();
|
|
|
|
output.write(osstr.as_bytes())?;
|
|
|
|
output.write(b"\n")?;
|
|
|
|
|
|
|
|
if (mode & libc::S_IFMT) == libc::S_IFDIR {
|
|
|
|
self.print_filenames(output, prefix, item)?;
|
|
|
|
} else if (mode & libc::S_IFMT) == libc::S_IFREG {
|
|
|
|
} else if (mode & libc::S_IFMT) == libc::S_IFLNK {
|
|
|
|
} else {
|
|
|
|
bail!("unknown item mode/type for {:?}", prefix);
|
|
|
|
}
|
|
|
|
|
|
|
|
prefix.pop();
|
|
|
|
}
|
|
|
|
|
|
|
|
Ok(())
|
|
|
|
}
|
|
|
|
}
|