use failure::*; use super::format_definition::*; use super::binary_search_tree::*; use std::io::Write; use std::os::unix::io::AsRawFd; use std::os::unix::ffi::OsStrExt; use std::os::unix::io::RawFd; use std::path::{Path, PathBuf}; use std::ffi::CStr; use nix::NixPath; use nix::fcntl::OFlag; use nix::sys::stat::Mode; use nix::errno::Errno; use nix::sys::stat::FileStat; use siphasher::sip::SipHasher24; const FILE_COPY_BUFFER_SIZE: usize = 1024*1024; pub struct CaTarEncoder { current_path: PathBuf, // used for error reporting writer: W, writer_pos: usize, size: usize, file_copy_buffer: Vec, } impl CaTarEncoder { pub fn encode(path: PathBuf, dir: &mut nix::dir::Dir, writer: W) -> Result<(), Error> { let mut file_copy_buffer = Vec::with_capacity(FILE_COPY_BUFFER_SIZE); unsafe { file_copy_buffer.set_len(FILE_COPY_BUFFER_SIZE); } let mut me = Self { current_path: path, writer: writer, writer_pos: 0, size: 0, file_copy_buffer, }; // todo: use scandirat?? me.encode_dir(dir)?; Ok(()) } fn write(&mut self, buf: &[u8]) -> Result<(), Error> { self.writer.write(buf)?; self.writer_pos += buf.len(); Ok(()) } fn flush_copy_buffer(&mut self, size: usize) -> Result<(), Error> { self.writer.write(&self.file_copy_buffer[..size])?; self.writer_pos += size; Ok(()) } fn write_header(&mut self, htype: u64, size: u64) -> Result<(), Error> { let mut buffer = [0u8; std::mem::size_of::()]; let mut header = crate::tools::map_struct_mut::(&mut buffer)?; header.size = u64::to_le((std::mem::size_of::() as u64) + size); header.htype = u64::to_le(htype); self.write(&buffer)?; Ok(()) } fn write_filename(&mut self, name: &CStr) -> Result<(), Error> { let buffer = name.to_bytes_with_nul(); self.write_header(CA_FORMAT_FILENAME, buffer.len() as u64)?; self.write(buffer)?; Ok(()) } fn write_entry(&mut self, stat: &FileStat) -> Result<(), Error> { let mut buffer = [0u8; std::mem::size_of::() + std::mem::size_of::()]; let mut header = crate::tools::map_struct_mut::(&mut buffer)?; header.size = u64::to_le((std::mem::size_of::() + std::mem::size_of::()) as u64); header.htype = u64::to_le(CA_FORMAT_ENTRY); let mut entry = crate::tools::map_struct_mut::(&mut buffer[std::mem::size_of::()..])?; entry.feature_flags = u64::to_le(CA_FORMAT_FEATURE_FLAGS_MAX); if (stat.st_mode & libc::S_IFMT) == libc::S_IFLNK { entry.mode = u64::to_le((libc::S_IFLNK | 0o777) as u64); } else { let mode = stat.st_mode & (libc::S_IFMT | 0o7777); entry.mode = u64::to_le(mode as u64); } entry.flags = 0; // todo: CHATTR, FAT_ATTRS, subvolume? entry.uid = u64::to_le(stat.st_uid as u64); entry.gid = u64::to_le(stat.st_gid as u64); let mtime = stat.st_mtime * 1_000_000_000 + stat.st_mtime_nsec; if mtime > 0 { entry.mtime = mtime as u64 }; self.write(&buffer)?; Ok(()) } fn encode_dir(&mut self, dir: &mut nix::dir::Dir) -> Result<(), Error> { println!("encode_dir: {:?} start {}", self.current_path, self.writer_pos); let mut name_list = vec![]; let rawfd = dir.as_raw_fd(); let dir_stat = match nix::sys::stat::fstat(rawfd) { Ok(stat) => stat, Err(err) => bail!("fstat {:?} failed - {}", self.current_path, err), }; if (dir_stat.st_mode & libc::S_IFMT) != libc::S_IFDIR { bail!("got unexpected file type {:?} (not a directory)", self.current_path); } let dir_start_pos = self.writer_pos; self.write_entry(&dir_stat)?; for entry in dir.iter() { let entry = match entry { Ok(entry) => entry, Err(err) => bail!("readir {:?} failed - {}", self.current_path, err), }; let filename = entry.file_name().to_owned(); let name = filename.to_bytes_with_nul(); let name_len = name.len(); if name_len == 2 && name[0] == b'.' && name[1] == 0u8 { continue; } if name_len == 3 && name[0] == b'.' && name[1] == b'.' && name[2] == 0u8 { continue; } match nix::sys::stat::fstatat(rawfd, filename.as_ref(), nix::fcntl::AtFlags::AT_SYMLINK_NOFOLLOW) { Ok(stat) => { name_list.push((filename, stat)); } Err(nix::Error::Sys(Errno::ENOENT)) => self.report_vanished_file(&self.current_path)?, Err(err) => bail!("fstat {:?} failed - {}", self.current_path, err), } } name_list.sort_unstable_by(|a, b| a.0.cmp(&b.0)); let mut goodby_items = vec![]; for (filename, stat) in &name_list { self.current_path.push(std::ffi::OsStr::from_bytes(filename.as_bytes())); let start_pos = self.writer_pos; self.write_filename(&filename)?; if (stat.st_mode & libc::S_IFMT) == libc::S_IFDIR { match nix::dir::Dir::openat(rawfd, filename.as_ref(), OFlag::O_NOFOLLOW, Mode::empty()) { Ok(mut dir) => self.encode_dir(&mut dir)?, Err(nix::Error::Sys(Errno::ENOENT)) => self.report_vanished_file(&self.current_path)?, Err(err) => bail!("open dir {:?} failed - {}", self.current_path, err), } } else if (stat.st_mode & libc::S_IFMT) == libc::S_IFREG { match nix::fcntl::openat(rawfd, filename.as_ref(), OFlag::O_NOFOLLOW, Mode::empty()) { Ok(filefd) => { let res = self.encode_file(filefd); let _ = nix::unistd::close(filefd); // ignore close errors res?; } Err(nix::Error::Sys(Errno::ENOENT)) => self.report_vanished_file(&self.current_path)?, Err(err) => bail!("open file {:?} failed - {}", self.current_path, err), } } else if (stat.st_mode & libc::S_IFMT) == libc::S_IFLNK { let mut buffer = [0u8; libc::PATH_MAX as usize]; let res = filename.with_nix_path(|cstr| { unsafe { libc::readlinkat(rawfd, cstr.as_ptr(), buffer.as_mut_ptr() as *mut libc::c_char, buffer.len()-1) } })?; match Errno::result(res) { Ok(len) => { buffer[len as usize] = 0u8; // add Nul byte self.encode_symlink(&buffer[..((len+1) as usize)], &stat)? } Err(nix::Error::Sys(Errno::ENOENT)) => self.report_vanished_file(&self.current_path)?, Err(err) => bail!("readlink {:?} failed - {}", self.current_path, err), } } else { bail!("unsupported file type (mode {:o} {:?})", stat.st_mode, self.current_path); } let end_pos = self.writer_pos; goodby_items.push(CaFormatGoodbyeItem { offset: start_pos as u64, size: (end_pos - start_pos) as u64, hash: compute_goodby_hash(&filename), }); self.current_path.pop(); } println!("encode_dir: {:?} end {}", self.current_path, self.writer_pos); let goodby_start = self.writer_pos as u64; let item_count = goodby_items.len(); let goodby_table_size = (item_count + 1)*std::mem::size_of::(); for item in &mut goodby_items { item.offset = goodby_start - item.offset; } // fixme: sort goodby_items (BST) let goodby_offset = self.writer_pos - dir_start_pos; self.write_header(CA_FORMAT_GOODBYE, goodby_table_size as u64)?; if goodby_table_size > FILE_COPY_BUFFER_SIZE { bail!("goodby table too large ({} > {})", goodby_table_size, FILE_COPY_BUFFER_SIZE); } let buffer = &mut self.file_copy_buffer; let buffer_ptr = buffer.as_ptr(); copy_binary_search_tree(item_count, |s, d| { let item = &goodby_items[s]; let offset = d*std::mem::size_of::(); let dest = crate::tools::map_struct_mut::(&mut buffer[offset..]).unwrap(); dest.offset = u64::to_le(item.offset); dest.size = u64::to_le(item.size); dest.hash = u64::to_le(item.hash); }); // append CaFormatGoodbyeTail as last item let offset = item_count*std::mem::size_of::(); let dest = crate::tools::map_struct_mut::(&mut buffer[offset..]).unwrap(); dest.offset = u64::to_le(goodby_offset as u64); dest.size = u64::to_le((goodby_table_size + std::mem::size_of::()) as u64); dest.hash = u64::to_le(CA_FORMAT_GOODBYE_TAIL_MARKER); self.flush_copy_buffer(goodby_table_size)?; println!("encode_dir: {:?} end1 {}", self.current_path, self.writer_pos); Ok(()) } fn encode_file(&mut self, filefd: RawFd) -> Result<(), Error> { println!("encode_file: {:?}", self.current_path); let stat = match nix::sys::stat::fstat(filefd) { Ok(stat) => stat, Err(err) => bail!("fstat {:?} failed - {}", self.current_path, err), }; if (stat.st_mode & libc::S_IFMT) != libc::S_IFREG { bail!("got unexpected file type {:?} (not a regular file)", self.current_path); } self.write_entry(&stat)?; let size = stat.st_size as u64; self.write_header(CA_FORMAT_PAYLOAD, size)?; let mut pos: u64 = 0; loop { let n = match nix::unistd::read(filefd, &mut self.file_copy_buffer) { Ok(n) => n, Err(nix::Error::Sys(Errno::EINTR)) => continue /* try again */, Err(err) => bail!("read {:?} failed - {}", self.current_path, err), }; if n == 0 { // EOF if pos != size { // Note:: casync format cannot handle that bail!("detected shrinked file {:?} ({} < {})", self.current_path, pos, size); } break; } let mut next = pos + (n as u64); if next > size { next = size; } let count = (next - pos) as usize; self.flush_copy_buffer(count)?; pos = next; if pos >= size { break; } } Ok(()) } fn encode_symlink(&mut self, target: &[u8], stat: &FileStat) -> Result<(), Error> { println!("encode_symlink: {:?} -> {:?}", self.current_path, target); self.write_entry(stat)?; self.write_header(CA_FORMAT_SYMLINK, target.len() as u64)?; self.write(target)?; Ok(()) } // the report_XXX method may raise and error - depending on encoder configuration fn report_vanished_file(&self, path: &Path) -> Result<(), Error> { eprintln!("WARNING: detected vanished file {:?}", path); Ok(()) } } fn compute_goodby_hash(name: &CStr) -> u64 { use std::hash::Hasher; let mut hasher = SipHasher24::new_with_keys(0x8574442b0f1d84b3, 0x2736ed30d1c22ec1); hasher.write(name.to_bytes()); hasher.finish() }