Allow eBPF map sizes and general buffer size for profiler to be chang…

…ed via CLI options (#54) * Add options to modify eBPF map sizes * eBPF map size info output now works * Convert PERF_BUFFER_BYTES into a command line config with default * add ProfilerConfig to integration_test * add ProfilerConfig default impl * Sane defaults for ProfilerConfig in Profiler default() * Add several test fixtures to support tests for perf buffer CLI argument
javierhonduco · Aug 13, 2024 · 81ccb90 · 81ccb90
1 parent abf0b12
commit 81ccb90
Show file tree

Hide file tree

Showing 4 changed files with 308 additions and 37 deletions.
diff --git a/src/collector.rs b/src/collector.rs
@@ -127,7 +127,7 @@ impl AggregatorCollector {
     }
 }
 
-/// Aggregagates the samples in memory, which might be acceptable when profiling for short amounts of time.
+/// Aggregates the samples in memory, which might be acceptable when profiling for short amounts of time.
 impl Collector for AggregatorCollector {
     fn collect(
         &mut self,

diff --git a/src/main.rs b/src/main.rs
@@ -1,3 +1,4 @@
+use core::str;
 use std::error::Error;
 use std::fs::File;
 use std::io::IsTerminal;
@@ -22,7 +23,7 @@ use tracing_subscriber::FmtSubscriber;
 use lightswitch::object::ObjectFile;
 use lightswitch::profile::symbolize_profile;
 use lightswitch::profile::{fold_profile, to_pprof};
-use lightswitch::profiler::Profiler;
+use lightswitch::profiler::{Profiler, ProfilerConfig};
 use lightswitch::unwind_info::in_memory_unwind_info;
 use lightswitch::unwind_info::remove_redundant;
 use lightswitch::unwind_info::remove_unnecesary_markers;
@@ -62,6 +63,27 @@ fn sample_freq_in_range(s: &str) -> Result<u16, String> {
     Ok(sample_freq as u16)
 }
 
+// Clap value_parser() in the form of: Fn(&str) -> Result<T,E>
+// Convert a &str into a usize, if possible, and return the result if it's a
+// power of 2, otherwise Error
+fn value_is_power_of_two(s: &str) -> Result<usize, String> {
+    let value: usize = s
+        .parse()
+        .map_err(|_| format!("`{s}' isn't a valid usize"))?;
+    // Now we have a value, test whether it's a power of 2
+    if is_power_of_two(value) {
+        Ok(value)
+    } else {
+        Err(format!("{} is not a power of 2", value))
+    }
+}
+
+fn is_power_of_two(v: usize) -> bool {
+    // NOTE: Neither 0 nor 1 are a power of 2 (ignoring 2^0 for this use case),
+    //       so rule them out
+    (v != 0) && (v != 1) && ((v & (v - 1)) == 0)
+}
+
 /// Given a non-prime unsigned int, return the prime number that precedes it
 /// as well as the prime that succeeds it
 fn primes_before_after(non_prime: usize) -> Result<(usize, usize), String> {
@@ -153,6 +175,51 @@ struct Cli {
     /// Where to write the profile.
     #[arg(long, default_value_t, value_enum)]
     sender: ProfileSender,
+    // Buffer Sizes with defaults
+    #[arg(long, default_value_t = 512 * 1024, value_name = "PERF_BUFFER_BYTES",
+          help="Size of each profiler perf buffer, in bytes (must be a power of 2)",
+          value_parser = value_is_power_of_two)]
+    perf_buffer_bytes: usize,
+    // Print out info on eBPF map sizes
+    #[arg(long, help = "Print eBPF map sizes after creation")]
+    mapsize_info: bool,
+    // eBPF map stacks
+    #[arg(
+        long,
+        default_value_t = 100000,
+        help = "max number of individual \
+        stacks to capture before aggregation"
+    )]
+    mapsize_stacks: u32,
+    // eBPF map aggregated_stacks
+    #[arg(
+        long,
+        default_value_t = 10000,
+        help = "Derived from constant MAX_AGGREGATED_STACKS_ENTRIES - max \
+                number of unique stacks after aggregation"
+    )]
+    mapsize_aggregated_stacks: u32,
+    // eBPF map unwind_info_chunks
+    #[arg(
+        long,
+        default_value_t = 5000,
+        help = "max number of chunks allowed inside a shard"
+    )]
+    mapsize_unwind_info_chunks: u32,
+    // eBPF map unwind_tables
+    #[arg(
+        long,
+        default_value_t = 65,
+        help = "Derived from constant MAX_UNWIND_INFO_SHARDS"
+    )]
+    mapsize_unwind_tables: u32,
+    // eBPF map rate_limits
+    #[arg(
+        long,
+        default_value_t = 5000,
+        help = "Derived from constant MAX_PROCESSES"
+    )]
+    mapsize_rate_limits: u32,
 }
 
 /// Exit the main thread if any thread panics. We prefer this behaviour because pretty much every
@@ -228,6 +295,21 @@ fn main() -> Result<(), Box<dyn Error>> {
         }
     }));
 
+    let profiler_config = ProfilerConfig {
+        // NOTE the difference in this arg name from the actual config name
+        libbpf_debug: args.libbpf_logs,
+        bpf_logging: args.bpf_logging,
+        duration: args.duration,
+        sample_freq: args.sample_freq,
+        perf_buffer_bytes: args.perf_buffer_bytes,
+        mapsize_info: args.mapsize_info,
+        mapsize_stacks: args.mapsize_stacks,
+        mapsize_aggregated_stacks: args.mapsize_aggregated_stacks,
+        mapsize_unwind_info_chunks: args.mapsize_unwind_info_chunks,
+        mapsize_unwind_tables: args.mapsize_unwind_tables,
+        mapsize_rate_limits: args.mapsize_rate_limits,
+    };
+
     let (stop_signal_sender, stop_signal_receive) = bounded(1);
 
     ctrlc::set_handler(move || {
@@ -236,13 +318,7 @@ fn main() -> Result<(), Box<dyn Error>> {
     })
     .expect("Error setting Ctrl-C handler");
 
-    let mut p: Profiler<'_> = Profiler::new(
-        args.libbpf_logs,
-        args.bpf_logging,
-        args.duration,
-        args.sample_freq,
-        stop_signal_receive,
-    );
+    let mut p: Profiler<'_> = Profiler::new(profiler_config, stop_signal_receive);
     p.profile_pids(args.pids);
     p.run(collector.clone());
 
@@ -305,7 +381,9 @@ mod tests {
     use super::*;
     use assert_cmd::Command;
     use clap::Parser;
-    use rstest::rstest;
+    use rand::distributions::{Distribution, Uniform};
+    use rstest::{fixture, rstest};
+    use std::collections::HashSet;
 
     #[test]
     fn verify_cli() {
@@ -322,7 +400,7 @@ mod tests {
         let actual = String::from_utf8(cmd.unwrap().stdout).unwrap();
         insta::assert_yaml_snapshot!(actual, @r###"
         ---
-        "Usage: lightswitch [OPTIONS]\n\nOptions:\n      --pids <PIDS>\n          Specific PIDs to profile\n\n      --tids <TIDS>\n          Specific TIDs to profile (these can be outside the PIDs selected above)\n\n      --show-unwind-info <PATH_TO_BINARY>\n          Show unwind info for given binary\n\n      --show-info <PATH_TO_BINARY>\n          Show build ID for given binary\n\n  -D, --duration <DURATION>\n          How long this agent will run in seconds\n          \n          [default: 18446744073709551615]\n\n      --libbpf-logs\n          Enable libbpf logs. This includes the BPF verifier output\n\n      --bpf-logging\n          Enable BPF programs logging\n\n      --logging <LOGGING>\n          Set lightswitch's logging level\n          \n          [default: info]\n          [possible values: trace, debug, info, warn, error]\n\n      --sample-freq <SAMPLE_FREQ_IN_HZ>\n          Per-CPU Sampling Frequency in Hz\n          \n          [default: 19]\n\n      --profile-format <PROFILE_FORMAT>\n          Output file for Flame Graph in SVG format\n          \n          [default: flame-graph]\n          [possible values: none, flame-graph, pprof]\n\n      --profile-name <PROFILE_NAME>\n          Name for the generated profile\n\n      --sender <SENDER>\n          Where to write the profile\n          \n          [default: local-disk]\n\n          Possible values:\n          - none:       Discard the profile. Used for kernel tests\n          - local-disk\n          - remote\n\n  -h, --help\n          Print help (see a summary with '-h')\n"
+        "Usage: lightswitch [OPTIONS]\n\nOptions:\n      --pids <PIDS>\n          Specific PIDs to profile\n\n      --tids <TIDS>\n          Specific TIDs to profile (these can be outside the PIDs selected above)\n\n      --show-unwind-info <PATH_TO_BINARY>\n          Show unwind info for given binary\n\n      --show-info <PATH_TO_BINARY>\n          Show build ID for given binary\n\n  -D, --duration <DURATION>\n          How long this agent will run in seconds\n          \n          [default: 18446744073709551615]\n\n      --libbpf-logs\n          Enable libbpf logs. This includes the BPF verifier output\n\n      --bpf-logging\n          Enable BPF programs logging\n\n      --logging <LOGGING>\n          Set lightswitch's logging level\n          \n          [default: info]\n          [possible values: trace, debug, info, warn, error]\n\n      --sample-freq <SAMPLE_FREQ_IN_HZ>\n          Per-CPU Sampling Frequency in Hz\n          \n          [default: 19]\n\n      --profile-format <PROFILE_FORMAT>\n          Output file for Flame Graph in SVG format\n          \n          [default: flame-graph]\n          [possible values: none, flame-graph, pprof]\n\n      --profile-name <PROFILE_NAME>\n          Name for the generated profile\n\n      --sender <SENDER>\n          Where to write the profile\n          \n          [default: local-disk]\n\n          Possible values:\n          - none:       Discard the profile. Used for kernel tests\n          - local-disk\n          - remote\n\n      --perf-buffer-bytes <PERF_BUFFER_BYTES>\n          Size of each profiler perf buffer, in bytes (must be a power of 2)\n          \n          [default: 524288]\n\n      --mapsize-info\n          Print eBPF map sizes after creation\n\n      --mapsize-stacks <MAPSIZE_STACKS>\n          max number of individual stacks to capture before aggregation\n          \n          [default: 100000]\n\n      --mapsize-aggregated-stacks <MAPSIZE_AGGREGATED_STACKS>\n          Derived from constant MAX_AGGREGATED_STACKS_ENTRIES - max number of unique stacks after aggregation\n          \n          [default: 10000]\n\n      --mapsize-unwind-info-chunks <MAPSIZE_UNWIND_INFO_CHUNKS>\n          max number of chunks allowed inside a shard\n          \n          [default: 5000]\n\n      --mapsize-unwind-tables <MAPSIZE_UNWIND_TABLES>\n          Derived from constant MAX_UNWIND_INFO_SHARDS\n          \n          [default: 65]\n\n      --mapsize-rate-limits <MAPSIZE_RATE_LIMITS>\n          Derived from constant MAX_PROCESSES\n          \n          [default: 5000]\n\n  -h, --help\n          Print help (see a summary with '-h')\n"
         "###);
     }
 
@@ -394,4 +472,94 @@ mod tests {
             }
         }
     }
+
+    // Powers of 2 in usize range
+    #[fixture]
+    fn power_of_two_usize() -> Vec<usize> {
+        let mut test_usizes = vec![];
+        for shift in 0..63 {
+            let val: usize = 2 << shift;
+            test_usizes.push(val);
+        }
+        test_usizes
+    }
+
+    // Powers of 2 represented as Strings
+    #[fixture]
+    fn power_of_two_strings(power_of_two_usize: Vec<usize>) -> Vec<String> {
+        let mut test_uint_strings = vec![];
+        for val in power_of_two_usize {
+            let val_str = val.to_string();
+            test_uint_strings.push(val_str);
+        }
+        test_uint_strings
+    }
+
+    // This fixture produces 5 million random results from the range of usize
+    // integers that are NOT powers of 2
+    #[fixture]
+    fn all_but_power_of_two_usize(power_of_two_usize: Vec<usize>) -> Vec<usize> {
+        let mut test_usize_set: HashSet<usize> = HashSet::new();
+        let mut test_usize_not_p2: Vec<usize> = vec![];
+        // usizes that ARE powers of two, for later exclusion
+        for val in power_of_two_usize {
+            test_usize_set.insert(val);
+        }
+        // Now, for a random sampling of 500000 integers in the range of usize,
+        // excluding any that are known to be powers of 2
+        let between = Uniform::from(0..=usize::MAX);
+        let mut rng = rand::thread_rng();
+        for _ in 0..500000 {
+            let usize_int: usize = between.sample(&mut rng);
+            if test_usize_set.contains(&usize_int) {
+                // We know this is a power of 2, already tested separately, skip
+                continue;
+            }
+            test_usize_not_p2.push(usize_int);
+        }
+        test_usize_not_p2
+    }
+
+    // all_but_power_of_two_usize, but as Strings
+    #[fixture]
+    fn all_but_power_of_two_strings(all_but_power_of_two_usize: Vec<usize>) -> Vec<String> {
+        let mut test_uint_strings: Vec<String> = vec![];
+        for val in all_but_power_of_two_usize {
+            let val_str = val.to_string();
+            test_uint_strings.push(val_str);
+        }
+        test_uint_strings
+    }
+
+    // Testing is_power_of_two predicate used by perf_buffer_bytes
+    // value_parser()
+    #[rstest]
+    fn test_should_be_powers_of_two(power_of_two_usize: Vec<usize>) {
+        for val in power_of_two_usize {
+            assert!(is_power_of_two(val))
+        }
+    }
+
+    #[rstest]
+    fn test_should_not_be_powers_of_two(all_but_power_of_two_usize: Vec<usize>) {
+        for val in all_but_power_of_two_usize {
+            assert!(!is_power_of_two(val))
+        }
+    }
+
+    // Testing the value_parser() implementation for perf_buffer_bytes
+    #[rstest]
+    fn args_should_be_powers_of_two(power_of_two_strings: Vec<String>) {
+        for val_string in power_of_two_strings {
+            assert!(value_is_power_of_two(val_string.as_str()).is_ok())
+        }
+    }
+
+    #[rstest]
+    fn args_should_not_be_powers_of_two(all_but_power_of_two_strings: Vec<String>) {
+        for non_p2_string in all_but_power_of_two_strings {
+            let result = value_is_power_of_two(non_p2_string.as_str());
+            assert!(result.is_err());
+        }
+    }
 }