add coeff_aggr.rs

This commit is contained in:
Youngjoon Lee 2024-09-09 14:42:27 +09:00
parent d43f08d2be
commit 809d43bec9
No known key found for this signature in database
GPG Key ID: 167546E2D1712F8C
2 changed files with 92 additions and 0 deletions

View File

@ -46,6 +46,11 @@ fn aggregate(path: &str) {
);
add_stats_columns(&mut df, entry.path().join("latency_stats.csv"), "latency_");
let coeff_stats_path = entry.path().join("coeff_stats.csv");
if coeff_stats_path.exists() {
add_stats_columns(&mut df, coeff_stats_path, "");
}
dataframes.push(df);
}
}

View File

@ -0,0 +1,87 @@
use glob::glob;
use polars::prelude::*;
use std::env;
use std::fs::File;
use walkdir::WalkDir;
fn aggregate(path: &str) {
for entry in WalkDir::new(path)
.into_iter()
.filter_map(|e| e.ok())
.filter(|e| e.file_type().is_dir())
{
let dir_name = entry.path().file_name().unwrap().to_string_lossy();
if dir_name.starts_with("paramset_") {
let mut strongs = Series::new_empty("", &DataType::Int64);
let mut casuals = Series::new_empty("", &DataType::Int64);
let mut weaks = Series::new_empty("", &DataType::Int64);
let pattern = format!("{}/**/coeffs.csv", entry.path().display());
for file in glob(&pattern).unwrap().filter_map(Result::ok) {
let df = CsvReadOptions::default()
.with_has_header(true)
.try_into_reader_with_file_path(Some(file.clone()))
.unwrap()
.finish()
.unwrap();
extend_series(&mut strongs, &df, "strong");
extend_series(&mut casuals, &df, "casual");
extend_series(&mut weaks, &df, "weak");
println!("Processed {}", file.display());
}
save_stats(
&strongs,
&format!("{}/strong_coeff_stats.csv", entry.path().display()),
);
save_stats(
&casuals,
&format!("{}/casual_coeff_stats.csv", entry.path().display()),
);
save_stats(
&weaks,
&format!("{}/weak_coeff_stats.csv", entry.path().display()),
);
}
}
}
fn extend_series(series: &mut Series, df: &DataFrame, column: &str) {
series
.extend(
&df.column(column)
.unwrap()
.i64()
.unwrap()
.clone()
.into_series(),
)
.unwrap();
}
fn save_stats(aggregated: &Series, outpath: &str) {
let mut df = DataFrame::new(vec![
Series::new("min", &[aggregated.min::<i64>().unwrap()]),
Series::new("median", &[aggregated.median().unwrap()]),
Series::new("mean", &[aggregated.mean().unwrap()]),
Series::new("std", &[aggregated.std(1).unwrap()]),
Series::new("max", &[aggregated.max::<i64>().unwrap()]),
])
.unwrap();
let mut file = File::create(outpath).unwrap();
CsvWriter::new(&mut file).finish(&mut df).unwrap();
println!("Saved {}", outpath);
}
fn main() {
let args: Vec<String> = env::args().collect();
if args.len() < 2 {
eprintln!("Usage: {} <path>", args[0]);
std::process::exit(1);
}
let path = &args[1];
aggregate(path);
}