process.rs 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273
  1. use std::{fmt::Debug, path::{Path, PathBuf}, fs::File, io::{Read, BufReader, BufRead, Write}, collections::{HashMap, HashSet}, net::Ipv4Addr};
  2. use anyhow::{Context, bail, anyhow};
  3. use clap::Parser;
  4. use json::JsonValue;
  5. use regex::Regex;
  6. use crate::run::{BENCH_BASE_PATH, BENCH_DATA_PATH};
  7. fn json_from_file<P>(path: P) -> anyhow::Result<HashMap<String, f64>>
  8. where
  9. P: Debug,
  10. P: AsRef<Path>
  11. {
  12. if !path.as_ref().exists() {
  13. return Ok(HashMap::new());
  14. }
  15. let mut vec = vec![];
  16. File::open(&path)
  17. .context(format!("Failed to open {:?}", path))?
  18. .read_to_end(&mut vec)?;
  19. let json_val = json::parse(String::from_utf8(vec)?.as_str())?;
  20. let json_obj = if let JsonValue::Object(o) = json_val {
  21. o
  22. } else {
  23. bail!("Expected json object, got: {}", json_val);
  24. };
  25. let mut map = HashMap::new();
  26. for (key, val) in json_obj.iter() {
  27. let val: f64 = match val {
  28. JsonValue::Number(n) => {
  29. f64::from(*n)
  30. },
  31. JsonValue::String(_) | JsonValue::Short(_) => {
  32. val.as_str()
  33. .unwrap()
  34. .strip_suffix("%")
  35. .ok_or(anyhow!("Expected percentage String, got: {:?}", val))?
  36. .parse()?
  37. },
  38. _ => bail!("Expected json number or string, got: {:?}", val),
  39. };
  40. map.insert(String::from(key), val);
  41. }
  42. Ok(map)
  43. }
  44. fn ips_from_file<P>(path: P) -> anyhow::Result<HashSet<Ipv4Addr>>
  45. where
  46. P: Debug,
  47. P: AsRef<Path>
  48. {
  49. let f = File::open(path)?;
  50. let reader = BufReader::new(f);
  51. let mut hashset = HashSet::new();
  52. for line in reader.lines() {
  53. let line = line?;
  54. hashset.insert(line.parse()?);
  55. }
  56. Ok(hashset)
  57. }
  58. fn parse_rate(rate: &str, unit: &str) -> anyhow::Result<f64> {
  59. let multiplier = match unit {
  60. "G" => 1_000_000_000f64,
  61. "M" => 1_000_000f64,
  62. "K" => 1_000f64,
  63. "" => 1f64,
  64. m => bail!("Unknown unit {} (rate: {})", m, rate)
  65. };
  66. let rate: f64 = rate.parse()?;
  67. return Ok(rate * multiplier)
  68. }
  69. fn zmap_stats<P>(path: P, regex: &Regex) -> anyhow::Result<(f64, f64, f64)>
  70. where
  71. P: Debug,
  72. P: AsRef<Path>
  73. {
  74. let f = File::open(path)?;
  75. let reader = BufReader::new(f);
  76. let mut rates = None;
  77. for line in reader.lines() {
  78. let line = line?;
  79. if let Some(capture) = regex.captures(&line) {
  80. let result: anyhow::Result<_> = (|| {
  81. let send_rate = capture
  82. .get(1)
  83. .ok_or(anyhow!("Capture group 1 did not match"))?;
  84. let send_rate_unit = capture
  85. .get(2)
  86. .ok_or(anyhow!("Capture group 2 did not match"))?;
  87. let send_rate = parse_rate(send_rate.as_str(), send_rate_unit.as_str())?;
  88. let receive_rate = capture
  89. .get(3)
  90. .ok_or(anyhow!("Capture group 3 did not match"))?;
  91. let receive_rate_unit = capture
  92. .get(4)
  93. .ok_or(anyhow!("Capture group 4 did not match"))?;
  94. let receive_rate = parse_rate(receive_rate.as_str(), receive_rate_unit.as_str())?;
  95. let drop_rate = capture
  96. .get(5)
  97. .ok_or(anyhow!("Capture group 5 did not match"))?;
  98. let drop_rate_unit = capture
  99. .get(6)
  100. .ok_or(anyhow!("Capture group 6 did not match"))?;
  101. let drop_rate = parse_rate(drop_rate.as_str(), drop_rate_unit.as_str())?;
  102. Ok((send_rate, receive_rate, drop_rate))
  103. })();
  104. rates = Some(result.context(format!("Failed to parse stats line: '{}'", line))?);
  105. }
  106. }
  107. rates.ok_or(anyhow!("Failed to find final stats line"))
  108. }
  109. #[derive(Debug, Parser)]
  110. pub struct Options {
  111. seed: String
  112. }
  113. pub fn process(opts: Options) -> anyhow::Result<()> {
  114. let mut path = PathBuf::new();
  115. path.push(BENCH_BASE_PATH);
  116. path.push(BENCH_DATA_PATH);
  117. path.push(opts.seed);
  118. let zmap_stats_regex = Regex::new(r"^[^\(;]+(?:\(.+left\))?; send: [^\(;]+done \(([\d\.]+) ([KMG]?)p/s avg\); recv: [^\(;]+\(([\d\.]+) ([KMG]?)p/s avg\); drops: [^\(;]+\(([\d\.]+) ([KMG]?)p/s avg\); hitrate: [^;]+$")?;
  119. let header_row = [
  120. "type", "filter-type",
  121. "subnet_size", "hitrate", "bloom_filter_bits", "bloom_filter_hash_count", "zmap_scanrate",
  122. "bpf_run_time_total", "bpf_run_count", "bpf_memory_lock",
  123. "filter_intern_build_time", "filter_intern_write_time",
  124. "filter_extern_time_clock", "filter_extern_cpu_p", "filter_extern_kernel_secs", "filter_extern_user_secs",
  125. "zmap_send_rate", "zmap_receive_rate", "zmap_drop_rate",
  126. "false_positive_count", "false_negative_count"
  127. ];
  128. let mut data_rows = vec![];
  129. data_rows.push(header_row.map(str::to_string));
  130. for subnet_dir in path.read_dir().context(format!("Failed to read subnet dirs in path {:?}", &path))? {
  131. let subnet_dir = subnet_dir.context(format!("Failed to read file info on file in path {:?}", &path))?;
  132. if !subnet_dir
  133. .file_type()
  134. .context(format!("Failed to read file info on file {:?}", subnet_dir.path()))?
  135. .is_dir() {
  136. bail!("Expected dir at {:?}", subnet_dir.path())
  137. }
  138. let subnet = subnet_dir.file_name().into_string().map_err(|e| anyhow!(format!("{:?}", e)))?;
  139. for hitrate_dir in subnet_dir.path().read_dir().context(format!("Failed to read hitrate dirs in path {:?}", subnet_dir.path()))? {
  140. let hitrate_dir = hitrate_dir.context(format!("Failed to read file info on file in path {:?}",subnet_dir.path()))?;
  141. if !hitrate_dir
  142. .file_type()
  143. .context(format!("Failed to read file info on file {:?}", hitrate_dir.path()))?
  144. .is_dir() {
  145. bail!("Expected dir at {:?}", hitrate_dir.path())
  146. }
  147. let hitrate = hitrate_dir.file_name().into_string().map_err(|e| anyhow!(format!("{:?}", e)))?;
  148. let in_ips = ips_from_file(hitrate_dir.path().join("ips.txt")).context(format!("Failed to read ips from {:?}/ips.txt", hitrate_dir.path()))?;
  149. for bloom_dir in hitrate_dir.path().read_dir().context(format!("Failed to read bloom dirs in path {:?}", hitrate_dir.path()))? {
  150. let bloom_dir = bloom_dir.context(format!("Failed to read file info on file in path {:?}", hitrate_dir.path()))?;
  151. if !bloom_dir
  152. .file_type()
  153. .context(format!("Failed to read file info on file {:?}", bloom_dir.path()))?
  154. .is_dir() {
  155. continue;
  156. }
  157. let bloom_folder_name = bloom_dir
  158. .file_name()
  159. .into_string()
  160. .map_err(|e| anyhow!(format!("{:?}", e)))?;
  161. let (test_type, filter_type, bloom_bits, bloom_hashes) = if bloom_folder_name.contains('-') {
  162. let (bloom_bits, rem) = bloom_folder_name.split_once("-")
  163. .ok_or(anyhow!("Expected filename with -, got {:?}", bloom_dir.file_name()))?;
  164. let (filter_type, rem) = rem.split_once("-").unwrap_or((rem, ""));
  165. let (bloom_hashes, bpf_enabled) = if filter_type == "bloom" {
  166. rem.split_once("-").map(|(c, rem)| (c,rem=="bpf")).unwrap_or((rem, false))
  167. } else {
  168. ("0", rem == "bpf")
  169. };
  170. let bloom_bits = bloom_bits.to_string();
  171. let bloom_hashes = bloom_hashes.to_string();
  172. let test_type = if bpf_enabled {
  173. "bpf-stats"
  174. } else {
  175. "normal"
  176. };
  177. (test_type, filter_type, bloom_bits, bloom_hashes)
  178. } else {
  179. ("baseline","none", String::from("-1"), String::from("-1"))
  180. };
  181. let bloom_path = bloom_dir.path();
  182. let mut filter_intern_time = json_from_file(bloom_path.join("filter_intern_time.json"))
  183. .context(format!("Failed to parse filter_intern_time.json for {:?}", bloom_path))?;
  184. let mut filter_extern_time = json_from_file(bloom_path.join("filter_extern_time.json"))
  185. .context(format!("Failed to parse filter_extern_time.json for {:?}", bloom_path))?;
  186. for scan_rate_dir in bloom_dir.path().read_dir().context(format!("Failed to read scan rate dirs in path {:?}", bloom_dir.path()))? {
  187. let scan_rate_dir = scan_rate_dir.context(format!("Failed to read file info on file in path {:?}", bloom_dir.path()))?;
  188. if !scan_rate_dir
  189. .file_type()
  190. .context(format!("Failed to read file info on file {:?}", scan_rate_dir.path()))?
  191. .is_dir() {
  192. continue;
  193. }
  194. let scan_rate = scan_rate_dir.file_name().to_str().unwrap().to_string();
  195. let wd_path = scan_rate_dir.path();
  196. let mut bpf_stats = json_from_file(wd_path.join("bpf_stats.json"))
  197. .context(format!("Failed to parse bpf_stats.json for {:?}", wd_path))?;
  198. let out_ips = ips_from_file(wd_path.join("zmap_out_ips.txt"))
  199. .context(format!("Failed to parse zmap_out_ips.txt from {:?}", wd_path))?;
  200. let zmap_stats = zmap_stats(wd_path.join("zmap_stats.txt"), &zmap_stats_regex)
  201. .context(format!("Failed to parse zmap_stats.txt from {:?}", wd_path))?;
  202. let get_or_default = |map: &mut HashMap<String, f64>, k: &str| map
  203. .get(k).unwrap_or(&-1f64).to_string();
  204. let data_row = (|| {
  205. Ok([
  206. test_type.to_owned(),
  207. filter_type.to_owned(),
  208. subnet.clone(), hitrate.clone(), bloom_bits.clone(), bloom_hashes.clone(), scan_rate.clone(),
  209. get_or_default(&mut bpf_stats, "run_time"),
  210. get_or_default(&mut bpf_stats, "run_count"),
  211. get_or_default(&mut bpf_stats, "mem_lock"),
  212. get_or_default(&mut filter_intern_time, "build"),
  213. get_or_default(&mut filter_intern_time, "write"),
  214. get_or_default(&mut filter_extern_time, "clock"),
  215. get_or_default(&mut filter_extern_time, "cpu_p"),
  216. get_or_default(&mut filter_extern_time, "kernel_s"),
  217. get_or_default(&mut filter_extern_time, "user_s"),
  218. zmap_stats.0.to_string(),
  219. zmap_stats.1.to_string(),
  220. zmap_stats.2.to_string(),
  221. out_ips.difference(&in_ips).count().to_string(),
  222. in_ips.difference(&out_ips).count().to_string(),
  223. ])
  224. })().map_err(|key: String| {
  225. anyhow!("Failed to read data point {} for {:?}", key, wd_path)
  226. })?;
  227. let mut f = File::create(wd_path.join("data_row.csv"))?;
  228. f.write_all(header_row.join(",").as_bytes())?;
  229. f.write(&[b'\n'])?;
  230. f.write_all(data_row.join(",").as_bytes())?;
  231. data_rows.push(data_row);
  232. }
  233. }
  234. }
  235. }
  236. let data = data_rows.into_iter()
  237. .map(|row| row.join(","))
  238. .fold(String::new(), |a, b| a + &b + "\n");
  239. File::create(path.join("data.csv"))?.write_all(data.as_bytes())?;
  240. Ok(())
  241. }