Compare commits

...

4 Commits
main ... main

Author SHA1 Message Date
Matteo Settenvini c9e39e284c Merge pull request 'Extra features and fixes' (#1) from arthurep/sysroot-cleaner:extra-features into main
Reviewed-on: matteo/sysroot-cleaner#1
Reviewed-by: Matteo Settenvini <matteo.settenvini@montecristosoftware.eu>
2025-03-19 21:29:33 +01:00
Arthur Pinheiro 6825d63aaa feat: display size of each file and total removed size 2025-03-14 10:46:24 +01:00
Arthur Pinheiro 266a00d983 feat: use vector for --allowlist and --blocklist for passing multiples 2025-03-14 10:46:24 +01:00
Arthur Pinheiro 8983863ffa fix: allow relative paths in allowlist and blocklist 2025-03-14 10:46:24 +01:00
4 changed files with 95 additions and 20 deletions

7
Cargo.lock generated
View File

@ -136,6 +136,12 @@ version = "1.10.0"
source = "registry+https://github.com/rust-lang/crates.io-index" source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "f61dac84819c6588b558454b194026eb1f09c293b9036ae9b159e74e73ab6cf9" checksum = "f61dac84819c6588b558454b194026eb1f09c293b9036ae9b159e74e73ab6cf9"
[[package]]
name = "bytesize"
version = "2.0.1"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "a3c8f83209414aacf0eeae3cf730b18d6981697fba62f200fcfb92b9f082acba"
[[package]] [[package]]
name = "cfg-if" name = "cfg-if"
version = "1.0.0" version = "1.0.0"
@ -634,6 +640,7 @@ version = "0.1.0"
dependencies = [ dependencies = [
"anyhow", "anyhow",
"async-trait", "async-trait",
"bytesize",
"clap", "clap",
"env_logger", "env_logger",
"goblin", "goblin",

View File

@ -23,3 +23,4 @@ nix = { version = "0.29", features = ["fs"] }
petgraph = { version = "0.7" } petgraph = { version = "0.7" }
tokio = { version = "1", features = ["full"] } tokio = { version = "1", features = ["full"] }
walkdir = { version = "2" } walkdir = { version = "2" }
bytesize = { version = "2.0" }

View File

@ -3,7 +3,29 @@
use std::path::PathBuf; use std::path::PathBuf;
use clap::Parser; use clap::{builder::{PathBufValueParser, TypedValueParser}, Parser};
#[derive(Clone, Default)]
struct AbsolutePathBufValueParser;
impl TypedValueParser for AbsolutePathBufValueParser {
type Value = PathBuf;
fn parse_ref(
&self,
cmd: &clap::Command,
arg: Option<&clap::Arg>,
value: &std::ffi::OsStr,
) -> Result<Self::Value, clap::Error> {
let pathbuf_parser = PathBufValueParser::new();
let v = pathbuf_parser.parse_ref(cmd, arg, value)?;
v.canonicalize().map_err(|e| clap::Error::raw(
clap::error::ErrorKind::Io,
e,
))
}
}
/// A tool to clean up sysroots for Linux embedded devices to save storage space. /// A tool to clean up sysroots for Linux embedded devices to save storage space.
#[derive(Parser, Debug)] #[derive(Parser, Debug)]
@ -19,13 +41,15 @@ pub struct Args {
pub split_to: Option<PathBuf>, pub split_to: Option<PathBuf>,
/// An allowlist of files to keep, in .gitignore format. /// An allowlist of files to keep, in .gitignore format.
/// Can be passed multiple times.
/// Note: this will take precedence over all other removal decisions. /// Note: this will take precedence over all other removal decisions.
#[arg(long)] #[arg(long, value_parser = AbsolutePathBufValueParser::default())]
pub allowlist: Option<PathBuf>, pub allowlist: Vec<PathBuf>,
/// A blocklist of files to remove, in .gitignore format. /// A blocklist of files to remove, in .gitignore format.
/// Can be passed multiple times.
#[arg(long)] #[arg(long)]
pub blocklist: Option<PathBuf>, pub blocklist: Vec<PathBuf>,
/// An optional path to save the file graph of the DSO cleaner /// An optional path to save the file graph of the DSO cleaner
/// in GraphViz format. Useful for debugging. /// in GraphViz format. Useful for debugging.
@ -35,3 +59,4 @@ pub struct Args {
/// The location of the sysroot to clean up /// The location of the sysroot to clean up
pub sysroot_location: PathBuf, pub sysroot_location: PathBuf,
} }

View File

@ -10,10 +10,11 @@ use crate::{
}; };
use anyhow::{Error, Result}; use anyhow::{Error, Result};
use async_trait::async_trait; use async_trait::async_trait;
use bytesize::ByteSize;
use dso::DsoCleaner; use dso::DsoCleaner;
use list::ListCleaner; use list::ListCleaner;
use nix::libc::EXDEV; use nix::libc::EXDEV;
use std::{collections::HashMap, io, path::Path}; use std::{collections::HashMap, fmt, io, ops::AddAssign, path::Path};
use tokio::{sync::mpsc, task::JoinSet}; use tokio::{sync::mpsc, task::JoinSet};
use walkdir::{DirEntry, WalkDir}; use walkdir::{DirEntry, WalkDir};
@ -26,8 +27,22 @@ pub trait Cleaner {
) -> Result<()>; ) -> Result<()>;
} }
struct FileSize(u64);
impl fmt::Display for FileSize {
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
write!(f, "{}", ByteSize(self.0))
}
}
impl AddAssign for FileSize {
fn add_assign(&mut self, rhs: Self) {
self.0.add_assign(rhs.0);
}
}
type Cleaners = Vec<Box<dyn Cleaner + Send>>; type Cleaners = Vec<Box<dyn Cleaner + Send>>;
type RemovalFn = Box<dyn Fn(&Path) -> io::Result<()>>; type RemovalFn = Box<dyn Fn(&Path) -> io::Result<FileSize>>;
pub struct Runner { pub struct Runner {
cleaners: Cleaners, cleaners: Cleaners,
@ -41,11 +56,11 @@ impl Runner {
let removal_fn = Self::new_removal_fn(&args); let removal_fn = Self::new_removal_fn(&args);
let mut cleaners: Cleaners = vec![]; let mut cleaners: Cleaners = vec![];
if let Some(wl) = args.allowlist { for wl in args.allowlist {
cleaners.push(Box::new(ListCleaner::new(list::ListType::Allow, wl))); cleaners.push(Box::new(ListCleaner::new(list::ListType::Allow, wl)));
} }
if let Some(bl) = args.blocklist { for bl in args.blocklist {
cleaners.push(Box::new(ListCleaner::new(list::ListType::Block, bl))); cleaners.push(Box::new(ListCleaner::new(list::ListType::Block, bl)));
} }
@ -129,6 +144,8 @@ impl Runner {
async fn final_decision(removal_fn: RemovalFn, mut output_rx: mpsc::Receiver<Decision>) { async fn final_decision(removal_fn: RemovalFn, mut output_rx: mpsc::Receiver<Decision>) {
let mut final_decisions = HashMap::new(); let mut final_decisions = HashMap::new();
let mut total_removed_size = FileSize(0);
while let Some(input_decision) = output_rx.recv().await { while let Some(input_decision) = output_rx.recv().await {
if input_decision.action == Action::Undecided { if input_decision.action == Action::Undecided {
continue; continue;
@ -147,28 +164,38 @@ impl Runner {
for (file, action) in final_decisions { for (file, action) in final_decisions {
if action == Action::Remove { if action == Action::Remove {
if let Err(err) = (removal_fn)(&file) { let removed_size = match (removal_fn)(&file) {
log::error!("{}: {}", file.display(), err); Ok(size) => size,
} Err(err) => {
log::error!("{}: {}", file.display(), err);
FileSize(0)
}
};
total_removed_size += removed_size;
} }
} }
log::info!("Total space removed: {}", total_removed_size);
} }
fn new_removal_fn(args: &Args) -> RemovalFn { fn new_removal_fn(args: &Args) -> RemovalFn {
if let Some(dest) = args.split_to.clone() { if let Some(dest) = args.split_to.clone() {
if args.dry_run { if args.dry_run {
Box::new(move |path| { Box::new(move |path| {
let size = Self::get_file_size(path)?;
log::info!( log::info!(
"(dry-run) would move {} to {}", "(dry-run) would move {} to {} ({})",
path.display(), path.display(),
dest.display() dest.display(),
size
); );
Ok(()) Ok(size)
}) })
} else { } else {
Box::new(move |path| { Box::new(move |path| {
log::info!("moving {} to {}", path.display(), dest.display()); let size = Self::get_file_size(path)?;
Self::move_preserve(&path, &dest) log::info!("moving {} to {} ({})", path.display(), dest.display(), size);
Self::move_preserve(&path, &dest)?;
Ok(size)
}) })
} }
} else { } else {
@ -179,18 +206,33 @@ impl Runner {
} else { } else {
"regular file" "regular file"
}; };
log::info!("(dry-run) would remove {} {}", ty, path.display()); let size = Self::get_file_size(path)?;
Ok(()) log::info!("(dry-run) would remove {} {} ({})", ty, path.display(), size);
Ok(size)
}) })
} else { } else {
Box::new(move |path| { Box::new(move |path| {
log::info!("removing {}", path.display()); let size = Self::get_file_size(path)?;
std::fs::remove_file(&path) log::info!("removing {} ({})", path.display(), size);
std::fs::remove_file(&path)?;
Ok(size)
}) })
} }
} }
} }
fn get_file_size(file: &Path) -> io::Result<FileSize> {
let lstat = nix::sys::stat::lstat(file);
let size = match lstat {
Err(err) => {
log::error!("failed to get metadata from: {}, {}", file.display(), err);
FileSize(0)
},
Ok(lstat) => FileSize(lstat.st_size as u64)
};
Ok(size)
}
fn move_preserve(src: &Path, dest: &Path) -> io::Result<()> { fn move_preserve(src: &Path, dest: &Path) -> io::Result<()> {
assert!(src.is_relative()); assert!(src.is_relative());
let abs_dest = dest.join(src); let abs_dest = dest.join(src);