Compare commits

..

3 Commits

3 changed files with 68 additions and 11 deletions

View File

@ -32,6 +32,14 @@ struct Args {
#[arg(short, long, default_value_t = 10)] #[arg(short, long, default_value_t = 10)]
top_n: usize, top_n: usize,
/// Include subpart headers keys in fingerprint
#[arg(short, long)]
include_header_keys: bool,
/// Include subpart params in fingerprint
#[arg(long)]
include_params: bool,
/// List of input directories to recursively search /// List of input directories to recursively search
input_dir: String, input_dir: String,
} }
@ -68,7 +76,12 @@ fn main() -> anyhow::Result<()> {
if should_skip(&arg) { if should_skip(&arg) {
return None; return None;
} }
match parse(&arg, youngest) { match parse(
&arg,
youngest,
args.include_header_keys,
args.include_params,
) {
Ok(Some(h)) => Some((h, arg)), Ok(Some(h)) => Some((h, arg)),
// Skip old emails // Skip old emails
Ok(None) => return None, Ok(None) => return None,
@ -116,7 +129,12 @@ fn main() -> anyhow::Result<()> {
} }
// If the date in the email is before youngest Ok(None) will be returned. // If the date in the email is before youngest Ok(None) will be returned.
fn parse<P: AsRef<Path>>(path: P, youngest: i64) -> Result<Option<String>, EmailError> { fn parse<P: AsRef<Path>>(
path: P,
youngest: i64,
include_header_keys: bool,
include_params: bool,
) -> Result<Option<String>, EmailError> {
let file = File::open(&path)?; let file = File::open(&path)?;
let mmap = unsafe { MmapOptions::new().map(&file)? }; let mmap = unsafe { MmapOptions::new().map(&file)? };
let m = parse_mail(&mmap)?; let m = parse_mail(&mmap)?;
@ -131,5 +149,7 @@ fn parse<P: AsRef<Path>>(path: P, youngest: i64) -> Result<Option<String>, Email
return Ok(None); return Ok(None);
} }
//println!("{}: {:#?}", path.as_ref().display(), m.ctype); //println!("{}: {:#?}", path.as_ref().display(), m.ctype);
Ok(Some(fingerprint(&m).join("\n"))) Ok(Some(
fingerprint(&m, include_header_keys, include_params).join("\n"),
))
} }

View File

@ -9,6 +9,14 @@ use memmap::MmapOptions;
#[derive(Parser, Debug)] #[derive(Parser, Debug)]
#[command(author, version, about, long_about = None)] #[command(author, version, about, long_about = None)]
struct Args { struct Args {
/// Include subpart headers keys in fingerprint
#[arg(short, long)]
include_header_keys: bool,
/// Include subpart params in fingerprint
#[arg(long)]
include_params: bool,
/// List of files to summarize /// List of files to summarize
paths: Vec<String>, paths: Vec<String>,
} }
@ -23,7 +31,10 @@ fn main() -> anyhow::Result<()> {
.headers .headers
.get_first_value("subject") .get_first_value("subject")
.unwrap_or("(NO SUBJECT)".to_owned()); .unwrap_or("(NO SUBJECT)".to_owned());
println!("{subject}: {path}\n{}", fingerprint(&m).join("\n")); println!(
"{subject}: {path}\n{}",
fingerprint(&m, args.include_header_keys, args.include_params).join("\n")
);
} }
Ok(()) Ok(())
} }

View File

@ -65,15 +65,41 @@ pub fn should_skip(path: &str) -> bool {
SKIP_FILES.contains(&filename) SKIP_FILES.contains(&filename)
} }
pub fn fingerprint(pm: &ParsedMail<'_>) -> Vec<String> { pub fn fingerprint(
fingerprint_rec(pm, 0) pm: &ParsedMail<'_>,
include_header_keys: bool,
include_params: bool,
) -> Vec<String> {
fingerprint_rec(pm, include_header_keys, include_params, 0)
}
fn fingerprint_rec(
pm: &ParsedMail<'_>,
include_header_keys: bool,
include_params: bool,
depth: usize,
) -> Vec<String> {
let indent = " ".repeat(depth * 2);
let mut parts = vec![format!("{}{}", indent, pm.ctype.mimetype)];
if include_header_keys {
parts.push(format!("{indent}Headers:"));
for k in &pm.headers {
parts.push(format!("{indent} {}", k.get_key()));
}
}
if include_params {
for (k, v) in &pm.ctype.params {
parts.push(format!("{indent} {k}: {v}"));
}
} }
fn fingerprint_rec(pm: &ParsedMail<'_>, depth: usize) -> Vec<String> {
let mut v = vec![format!("{}{}", " ".repeat(depth * 2), pm.ctype.mimetype)];
for c in &pm.subparts { for c in &pm.subparts {
v.extend(fingerprint_rec(&c, depth + 1)); parts.extend(fingerprint_rec(
&c,
include_header_keys,
include_params,
depth + 1,
));
} }
v parts
} }
#[cfg(test)] #[cfg(test)]