catar/decoder.rs: start implementation
This commit is contained in:
		@ -1,3 +1,253 @@
 | 
			
		||||
//! *catar* format decoder.
 | 
			
		||||
//!
 | 
			
		||||
//! This module contains the code to decode *catar* archive files.
 | 
			
		||||
 | 
			
		||||
use failure::*;
 | 
			
		||||
 | 
			
		||||
use super::format_definition::*;
 | 
			
		||||
use crate::tools;
 | 
			
		||||
 | 
			
		||||
use std::io::{Read, Seek, SeekFrom};
 | 
			
		||||
use std::path::PathBuf;
 | 
			
		||||
 | 
			
		||||
use std::os::unix::ffi::{OsStrExt, OsStringExt};
 | 
			
		||||
use std::ffi::{OsStr, OsString};
 | 
			
		||||
 | 
			
		||||
pub struct CaDirectoryEntry {
 | 
			
		||||
    start: u64,
 | 
			
		||||
    end: u64,
 | 
			
		||||
    pub filename: OsString,
 | 
			
		||||
    pub entry: CaFormatEntry,
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
// This one needs Read+Seek (we may want one without Seek?)
 | 
			
		||||
/// Random-access decoder for a *catar* archive stored in a seekable stream.
pub struct CaTarDecoder<'a, R: Read + Seek> {
    /// Borrowed archive stream; every decoding step seeks and reads through it.
    reader: &'a mut R,
    /// Absolute offset at which the root object starts.
    root_start: u64,
    /// Absolute offset one past the end of the root object.
    root_end: u64,
}
 | 
			
		||||
 | 
			
		||||
/// Size in bytes of a `CaFormatHeader`, as reported by `std::mem::size_of`.
const HEADER_SIZE: u64 = std::mem::size_of::<CaFormatHeader>() as u64;
 | 
			
		||||
 | 
			
		||||
impl <'a, R: Read + Seek> CaTarDecoder<'a, R> {
 | 
			
		||||
 | 
			
		||||
    pub fn new(reader: &'a mut R) -> Result<Self, Error> {
 | 
			
		||||
 | 
			
		||||
        let root_end = reader.seek(SeekFrom::End(0))?;
 | 
			
		||||
 | 
			
		||||
        Ok(Self {
 | 
			
		||||
            reader: reader,
 | 
			
		||||
            root_start: 0,
 | 
			
		||||
            root_end: root_end,
 | 
			
		||||
        })
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    pub fn root(&self) -> CaDirectoryEntry {
 | 
			
		||||
        CaDirectoryEntry {
 | 
			
		||||
            start: self.root_start,
 | 
			
		||||
            end: self.root_end,
 | 
			
		||||
            filename: OsString::new(), // Empty
 | 
			
		||||
            entry: CaFormatEntry {
 | 
			
		||||
                feature_flags: 0,
 | 
			
		||||
                mode: 0,
 | 
			
		||||
                flags: 0,
 | 
			
		||||
                uid: 0,
 | 
			
		||||
                gid: 0,
 | 
			
		||||
                mtime: 0,
 | 
			
		||||
            }
 | 
			
		||||
        }
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    fn read_directory_entry(&mut self, start: u64, end: u64) -> Result<CaDirectoryEntry, Error> {
 | 
			
		||||
 | 
			
		||||
        self.reader.seek(SeekFrom::Start(start))?;
 | 
			
		||||
        let mut buffer = [0u8; HEADER_SIZE as usize];
 | 
			
		||||
        self.reader.read_exact(&mut buffer)?;
 | 
			
		||||
        let head = tools::map_struct::<CaFormatHeader>(&buffer)?;
 | 
			
		||||
 | 
			
		||||
        if u64::from_le(head.htype) != CA_FORMAT_FILENAME {
 | 
			
		||||
            bail!("wrong filename header type for object [{}..{}]", start, end);
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        let mut name_len = u64::from_le(head.size);
 | 
			
		||||
 | 
			
		||||
        let entry_start = start + name_len;
 | 
			
		||||
 | 
			
		||||
        if name_len < (HEADER_SIZE + 2) {
 | 
			
		||||
            bail!("filename size too short for object [{}..{}]", start, end);
 | 
			
		||||
        }
 | 
			
		||||
        name_len -= HEADER_SIZE;
 | 
			
		||||
 | 
			
		||||
        if name_len > ((libc::FILENAME_MAX as u64) + 1) {
 | 
			
		||||
            bail!("filename too long for object [{}..{}]", start, end);
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        let mut buffer = vec![0u8; name_len as usize];
 | 
			
		||||
        self.reader.read_exact(&mut buffer)?;
 | 
			
		||||
 | 
			
		||||
        // fixme: check nul termination
 | 
			
		||||
        let last_byte = buffer.pop().unwrap();
 | 
			
		||||
        if last_byte != 0u8 {
 | 
			
		||||
            bail!("filename entry not nul terminated, object [{}..{}]", start, end);
 | 
			
		||||
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        let filename = std::ffi::OsString::from_vec(buffer);
 | 
			
		||||
 | 
			
		||||
        let mut buffer = [0u8; HEADER_SIZE as usize];
 | 
			
		||||
        self.reader.read_exact(&mut buffer)?;
 | 
			
		||||
        let head = tools::map_struct::<CaFormatHeader>(&buffer)?;
 | 
			
		||||
 | 
			
		||||
        if u64::from_le(head.htype) != CA_FORMAT_ENTRY {
 | 
			
		||||
            bail!("wrong entry header type for object [{}..{}]", start, end);
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        const ENTRY_SIZE: u64 = std::mem::size_of::<CaFormatEntry>() as u64;
 | 
			
		||||
 | 
			
		||||
        let mut entry_len = u64::from_le(head.size);
 | 
			
		||||
        if entry_len != (HEADER_SIZE + ENTRY_SIZE) {
 | 
			
		||||
            bail!("wrong entry header size for object [{}..{}]", start, end);
 | 
			
		||||
        }
 | 
			
		||||
        entry_len -= HEADER_SIZE;
 | 
			
		||||
 | 
			
		||||
        let mut buffer = [0u8; ENTRY_SIZE as usize];
 | 
			
		||||
        self.reader.read_exact(&mut buffer)?;
 | 
			
		||||
        let entry = tools::map_struct::<CaFormatEntry>(&buffer)?;
 | 
			
		||||
 | 
			
		||||
        Ok(CaDirectoryEntry {
 | 
			
		||||
            start: entry_start,
 | 
			
		||||
            end: end,
 | 
			
		||||
            filename: filename,
 | 
			
		||||
            entry: CaFormatEntry {
 | 
			
		||||
                feature_flags: u64::from_le(entry.feature_flags),
 | 
			
		||||
                mode: u64::from_le(entry.mode),
 | 
			
		||||
                flags: u64::from_le(entry.flags),
 | 
			
		||||
                uid: u64::from_le(entry.uid),
 | 
			
		||||
                gid: u64::from_le(entry.gid),
 | 
			
		||||
                mtime: u64::from_le(entry.mtime),
 | 
			
		||||
            },
 | 
			
		||||
        })
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    pub fn list_dir(&mut self, dir: &CaDirectoryEntry) -> Result<Vec<CaDirectoryEntry>, Error> {
 | 
			
		||||
 | 
			
		||||
        const GOODBYE_ITEM_SIZE: u64 = std::mem::size_of::<CaFormatGoodbyeItem>() as u64;
 | 
			
		||||
 | 
			
		||||
        let start = dir.start;
 | 
			
		||||
        let end = dir.end;
 | 
			
		||||
 | 
			
		||||
        //println!("list_dir1: {} {}", start, end);
 | 
			
		||||
 | 
			
		||||
        if (end - start) < (HEADER_SIZE + GOODBYE_ITEM_SIZE) {
 | 
			
		||||
            bail!("detected short object [{}..{}]", start, end);
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        self.reader.seek(SeekFrom::Start(end - GOODBYE_ITEM_SIZE))?;
 | 
			
		||||
        let mut buffer = [0u8; GOODBYE_ITEM_SIZE as usize];
 | 
			
		||||
        self.reader.read_exact(&mut buffer)?;
 | 
			
		||||
 | 
			
		||||
        let item = tools::map_struct::<CaFormatGoodbyeItem>(&buffer)?;
 | 
			
		||||
 | 
			
		||||
        if u64::from_le(item.hash) != CA_FORMAT_GOODBYE_TAIL_MARKER {
 | 
			
		||||
            bail!("missing goodbye tail marker for object [{}..{}]", start, end);
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        let goodbye_table_size = u64::from_le(item.size);
 | 
			
		||||
        if goodbye_table_size < (HEADER_SIZE + GOODBYE_ITEM_SIZE) {
 | 
			
		||||
            bail!("short goodbye table size for object [{}..{}]", start, end);
 | 
			
		||||
 | 
			
		||||
        }
 | 
			
		||||
        let goodbye_inner_size = goodbye_table_size - HEADER_SIZE - GOODBYE_ITEM_SIZE;
 | 
			
		||||
        if (goodbye_inner_size % GOODBYE_ITEM_SIZE) != 0 {
 | 
			
		||||
            bail!("wrong goodbye inner table size for entry [{}..{}]", start, end);
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        let goodbye_start = end - goodbye_table_size;
 | 
			
		||||
 | 
			
		||||
        if u64::from_le(item.offset) != (goodbye_start - start) {
 | 
			
		||||
            println!("DEBUG: {} {}", u64::from_le(item.offset), goodbye_start - start);
 | 
			
		||||
            bail!("wrong offset in goodbye tail marker for entry [{}..{}]", start, end);
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        self.reader.seek(SeekFrom::Start(goodbye_start))?;
 | 
			
		||||
        let mut buffer = [0u8; HEADER_SIZE as usize];
 | 
			
		||||
        self.reader.read_exact(&mut buffer)?;
 | 
			
		||||
        let head = tools::map_struct::<CaFormatHeader>(&buffer)?;
 | 
			
		||||
 | 
			
		||||
        if u64::from_le(head.htype) != CA_FORMAT_GOODBYE {
 | 
			
		||||
            bail!("wrong goodbye table header type for entry [{}..{}]", start, end);
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        if u64::from_le(head.size) != goodbye_table_size {
 | 
			
		||||
            bail!("wrong goodbye table size for entry [{}..{}]", start, end);
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        let mut buffer = [0u8; GOODBYE_ITEM_SIZE as usize];
 | 
			
		||||
 | 
			
		||||
        let mut range_list = Vec::new();
 | 
			
		||||
 | 
			
		||||
        for i in 0..goodbye_inner_size/GOODBYE_ITEM_SIZE {
 | 
			
		||||
            self.reader.read_exact(&mut buffer)?;
 | 
			
		||||
            let item = tools::map_struct::<CaFormatGoodbyeItem>(&buffer)?;
 | 
			
		||||
            let item_offset = u64::from_le(item.offset);
 | 
			
		||||
            if item_offset > (goodbye_start - start) {
 | 
			
		||||
                bail!("goodbye entry {} offset out of range [{}..{}] {} {} {}",
 | 
			
		||||
                      i, start, end, item_offset, goodbye_start, start);
 | 
			
		||||
            }
 | 
			
		||||
            let item_start = goodbye_start - item_offset;
 | 
			
		||||
            let item_hash = u64::from_le(item.hash);
 | 
			
		||||
            let item_end = item_start + u64::from_le(item.size);
 | 
			
		||||
            if item_end > goodbye_start {
 | 
			
		||||
                bail!("goodbye entry {} end out of range [{}..{}]",
 | 
			
		||||
                      i, start, end);
 | 
			
		||||
            }
 | 
			
		||||
 | 
			
		||||
            range_list.push((item_start, item_end));
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        let mut result = vec![];
 | 
			
		||||
 | 
			
		||||
        for (item_start, item_end) in range_list {
 | 
			
		||||
            let entry = self.read_directory_entry(item_start, item_end)?;
 | 
			
		||||
            //println!("ENTRY: {} {} {:?}", item_start, item_end, entry.filename);
 | 
			
		||||
            result.push(entry);
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        Ok(result)
 | 
			
		||||
    }
 | 
			
		||||
 | 
			
		||||
    pub fn print_filenames<W: std::io::Write>(
 | 
			
		||||
        &mut self,
 | 
			
		||||
        output: &mut W,
 | 
			
		||||
        prefix: &mut PathBuf,
 | 
			
		||||
        dir: &CaDirectoryEntry,
 | 
			
		||||
    ) -> Result<(), Error> {
 | 
			
		||||
 | 
			
		||||
        let mut list = self.list_dir(dir)?;
 | 
			
		||||
 | 
			
		||||
        list.sort_unstable_by(|a, b| a.filename.cmp(&b.filename));
 | 
			
		||||
 | 
			
		||||
        for item in &list {
 | 
			
		||||
 | 
			
		||||
            prefix.push(item.filename.clone());
 | 
			
		||||
 | 
			
		||||
            let mode = item.entry.mode as u32;
 | 
			
		||||
 | 
			
		||||
            let osstr: &OsStr =  prefix.as_ref();
 | 
			
		||||
            output.write(osstr.as_bytes())?;
 | 
			
		||||
            output.write(b"\n")?;
 | 
			
		||||
 | 
			
		||||
            if (mode & libc::S_IFMT) == libc::S_IFDIR {
 | 
			
		||||
                self.print_filenames(output, prefix, item)?;
 | 
			
		||||
            } else if (mode & libc::S_IFMT) == libc::S_IFREG {
 | 
			
		||||
            } else if (mode & libc::S_IFMT) == libc::S_IFLNK {
 | 
			
		||||
            } else {
 | 
			
		||||
                bail!("unknown item mode/type for {:?}", prefix);
 | 
			
		||||
            }
 | 
			
		||||
 | 
			
		||||
            prefix.pop();
 | 
			
		||||
        }
 | 
			
		||||
 | 
			
		||||
        Ok(())
 | 
			
		||||
    }
 | 
			
		||||
}
 | 
			
		||||
 | 
			
		||||
		Reference in New Issue
	
	Block a user