use anyhow::{bail, Context, Result}; use std::fs::{read_link, symlink_metadata}; use std::io::{empty, BufWriter, Write}; use std::path::Path; use tar::{Builder, Header}; use walkdir::WalkDir; use crate::{ compression::{CombinedEncoder, CompressionFormats}, util::*, }; actor! { #[derive(Debug)] pub struct Tarballer { /// The input folder to be compressed. #[clap(value_name = "NAME")] input: String = "package", /// The prefix of the tarballs. #[clap(value_name = "PATH")] output: String = "./dist", /// The folder in which the input is to be found. #[clap(value_name = "DIR")] work_dir: String = "./workdir", /// The formats used to compress the tarball. #[clap(value_name = "FORMAT", default_value_t)] compression_formats: CompressionFormats, } } impl Tarballer { /// Generates the actual tarballs pub fn run(self) -> Result<()> { let tarball_name = self.output.clone() + ".tar"; let encoder = CombinedEncoder::new( self.compression_formats .iter() .map(|f| f.encode(&tarball_name)) .collect::>>()?, ); // Sort files by their suffix, to group files with the same name from // different locations (likely identical) and files with the same // extension (likely containing similar data). let (dirs, mut files) = get_recursive_paths(&self.work_dir, &self.input) .context("failed to collect file paths")?; files.sort_by(|a, b| a.bytes().rev().cmp(b.bytes().rev())); // Write the tar into both encoded files. We write all directories // first, so files may be directly created. (See rust-lang/rustup.rs#1092.) let buf = BufWriter::with_capacity(1024 * 1024, encoder); let mut builder = Builder::new(buf); let pool = rayon::ThreadPoolBuilder::new() .num_threads(2) .build() .unwrap(); pool.install(move || { for path in dirs { let src = Path::new(&self.work_dir).join(&path); builder .append_dir(&path, &src) .with_context(|| format!("failed to tar dir '{}'", src.display()))?; } for path in files { let src = Path::new(&self.work_dir).join(&path); append_path(&mut builder, &src, &path) .with_context(|| format!("failed to tar file '{}'", src.display()))?; } builder .into_inner() .context("failed to finish writing .tar stream")? .into_inner() .ok() .unwrap() .finish()?; Ok(()) }) } } fn append_path(builder: &mut Builder, src: &Path, path: &String) -> Result<()> { let stat = symlink_metadata(src)?; let mut header = Header::new_gnu(); header.set_metadata(&stat); if stat.file_type().is_symlink() { let link = read_link(src)?; header.set_link_name(&link)?; builder.append_data(&mut header, path, &mut empty())?; } else { if cfg!(windows) { // Windows doesn't really have a mode, so `tar` never marks files executable. // Use an extension whitelist to update files that usually should be so. const EXECUTABLES: [&'static str; 4] = ["exe", "dll", "py", "sh"]; if let Some(ext) = src.extension().and_then(|s| s.to_str()) { if EXECUTABLES.contains(&ext) { let mode = header.mode()?; header.set_mode(mode | 0o111); } } } let file = open_file(src)?; builder.append_data(&mut header, path, &file)?; } Ok(()) } /// Returns all `(directories, files)` under the source path. fn get_recursive_paths(root: P, name: Q) -> Result<(Vec, Vec)> where P: AsRef, Q: AsRef, { let root = root.as_ref(); let name = name.as_ref(); if !name.is_relative() && !name.starts_with(root) { bail!( "input '{}' is not in work dir '{}'", name.display(), root.display() ); } let mut dirs = vec![]; let mut files = vec![]; for entry in WalkDir::new(root.join(name)) { let entry = entry?; let path = entry.path().strip_prefix(root)?; let path = path_to_str(&path)?; if entry.file_type().is_dir() { dirs.push(path.to_owned()); } else { files.push(path.to_owned()); } } Ok((dirs, files)) }