2019-09-30 08:58:53 +00:00
//! FIXME: write short doc here
2019-06-30 10:30:17 +00:00
mod memory_usage ;
2019-08-17 12:29:57 +00:00
#[ cfg(feature = " cpu_profiler " ) ]
mod google_cpu_profiler ;
2019-06-30 10:30:17 +00:00
2019-05-07 17:54:33 +00:00
use std ::{
cell ::RefCell ,
2020-01-19 15:07:15 +00:00
collections ::BTreeMap ,
2019-07-04 20:05:17 +00:00
collections ::HashSet ,
2019-05-07 17:54:33 +00:00
io ::{ stderr , Write } ,
2019-07-04 20:05:17 +00:00
mem ,
sync ::{
atomic ::{ AtomicBool , Ordering } ,
RwLock ,
} ,
time ::{ Duration , Instant } ,
2019-05-07 17:54:33 +00:00
} ;
2019-07-04 20:05:17 +00:00
use once_cell ::sync ::Lazy ;
2019-03-27 15:09:51 +00:00
2019-07-04 20:05:17 +00:00
pub use crate ::memory_usage ::{ Bytes , MemoryUsage } ;
2019-06-30 10:30:17 +00:00
// We use jemalloc mainly to get heap usage statistics, actual performance
// difference is not measures.
2019-11-14 16:47:18 +00:00
#[ cfg(all(feature = " jemalloc " , not(target_env = " msvc " ))) ]
2019-06-30 10:30:17 +00:00
#[ global_allocator ]
static ALLOC : jemallocator ::Jemalloc = jemallocator ::Jemalloc ;
2019-04-03 13:05:55 +00:00
/// Set profiling filter. It specifies descriptions allowed to profile.
/// This is helpful when call stack has too many nested profiling scopes.
/// Additionally filter can specify maximum depth of profiling scopes nesting.
///
/// #Example
/// ```
2019-04-14 22:03:11 +00:00
/// use ra_prof::{set_filter, Filter};
/// let f = Filter::from_spec("profile1|profile2@2");
2019-04-03 13:05:55 +00:00
/// set_filter(f);
/// ```
2019-03-29 12:34:05 +00:00
pub fn set_filter ( f : Filter ) {
2019-04-14 19:54:57 +00:00
PROFILING_ENABLED . store ( f . depth > 0 , Ordering ::SeqCst ) ;
2019-05-07 17:54:33 +00:00
let set : HashSet < _ > = f . allowed . iter ( ) . cloned ( ) . collect ( ) ;
2019-03-29 12:34:05 +00:00
let mut old = FILTER . write ( ) . unwrap ( ) ;
2019-04-14 20:20:12 +00:00
let filter_data = FilterData {
depth : f . depth ,
allowed : set ,
longer_than : f . longer_than ,
version : old . version + 1 ,
} ;
2019-03-29 12:34:05 +00:00
* old = filter_data ;
}
2019-04-03 13:05:55 +00:00
/// This function starts a profiling scope in the current execution stack with a given description.
/// It returns a Profile structure and measure elapsed time between this method invocation and Profile structure drop.
/// It supports nested profiling scopes in case when this function invoked multiple times at the execution stack. In this case the profiling information will be nested at the output.
/// Profiling information is being printed in the stderr.
///
2019-07-06 11:04:56 +00:00
/// # Example
2019-04-03 13:05:55 +00:00
/// ```
2019-04-14 22:03:11 +00:00
/// use ra_prof::{profile, set_filter, Filter};
2019-04-03 13:05:55 +00:00
///
2019-04-14 22:03:11 +00:00
/// let f = Filter::from_spec("profile1|profile2@2");
2019-04-03 13:05:55 +00:00
/// set_filter(f);
/// profiling_function1();
///
/// fn profiling_function1() {
/// let _p = profile("profile1");
/// profiling_function2();
/// }
///
/// fn profiling_function2() {
/// let _p = profile("profile2");
/// }
/// ```
/// This will print in the stderr the following:
/// ```text
/// 0ms - profile
/// 0ms - profile2
/// ```
2019-03-29 12:34:05 +00:00
pub fn profile ( desc : & str ) -> Profiler {
2019-04-14 19:54:57 +00:00
assert! ( ! desc . is_empty ( ) ) ;
if ! PROFILING_ENABLED . load ( Ordering ::Relaxed ) {
return Profiler { desc : None } ;
}
2019-03-29 12:34:05 +00:00
PROFILE_STACK . with ( | stack | {
let mut stack = stack . borrow_mut ( ) ;
2019-04-26 15:42:56 +00:00
if stack . starts . is_empty ( ) {
if let Ok ( f ) = FILTER . try_read ( ) {
if f . version > stack . filter_data . version {
stack . filter_data = f . clone ( ) ;
2019-03-29 12:34:05 +00:00
}
} ;
}
2019-04-14 19:54:57 +00:00
if stack . starts . len ( ) > stack . filter_data . depth {
return Profiler { desc : None } ;
}
2019-06-01 07:41:47 +00:00
let allowed = & stack . filter_data . allowed ;
if stack . starts . is_empty ( ) & & ! allowed . is_empty ( ) & & ! allowed . contains ( desc ) {
return Profiler { desc : None } ;
2019-03-29 12:34:05 +00:00
}
2019-06-01 07:41:47 +00:00
stack . starts . push ( Instant ::now ( ) ) ;
Profiler { desc : Some ( desc . to_string ( ) ) }
2019-03-29 12:34:05 +00:00
} )
}
2019-03-27 15:09:51 +00:00
pub struct Profiler {
2019-03-29 12:34:05 +00:00
desc : Option < String > ,
2019-03-27 15:09:51 +00:00
}
pub struct Filter {
depth : usize ,
allowed : Vec < String > ,
2019-04-14 20:20:12 +00:00
longer_than : Duration ,
2019-03-27 15:09:51 +00:00
}
2019-04-02 14:52:04 +00:00
impl Filter {
2019-04-14 20:18:58 +00:00
// Filtering syntax
// env RA_PROFILE=* // dump everything
// env RA_PROFILE=foo|bar|baz // enabled only selected entries
// env RA_PROFILE=*@3>10 // dump everything, up to depth 3, if it takes more than 10 ms
pub fn from_spec ( mut spec : & str ) -> Filter {
2019-04-26 15:41:58 +00:00
let longer_than = if let Some ( idx ) = spec . rfind ( '>' ) {
2019-04-14 20:20:12 +00:00
let longer_than = spec [ idx + 1 .. ] . parse ( ) . expect ( " invalid profile longer_than " ) ;
2019-04-14 20:18:58 +00:00
spec = & spec [ .. idx ] ;
2019-04-14 20:20:12 +00:00
Duration ::from_millis ( longer_than )
2019-04-14 20:18:58 +00:00
} else {
Duration ::new ( 0 , 0 )
} ;
2019-04-26 15:41:58 +00:00
let depth = if let Some ( idx ) = spec . rfind ( '@' ) {
2019-04-14 20:18:58 +00:00
let depth : usize = spec [ idx + 1 .. ] . parse ( ) . expect ( " invalid profile depth " ) ;
spec = & spec [ .. idx ] ;
depth
} else {
999
} ;
let allowed =
2019-04-26 15:41:58 +00:00
if spec = = " * " { Vec ::new ( ) } else { spec . split ( '|' ) . map ( String ::from ) . collect ( ) } ;
2019-04-14 20:20:12 +00:00
Filter ::new ( depth , allowed , longer_than )
2019-04-14 20:18:58 +00:00
}
2019-04-14 20:04:08 +00:00
pub fn disabled ( ) -> Filter {
2019-04-14 20:18:58 +00:00
Filter ::new ( 0 , Vec ::new ( ) , Duration ::new ( 0 , 0 ) )
2019-04-14 20:04:08 +00:00
}
2019-04-14 20:20:12 +00:00
pub fn new ( depth : usize , allowed : Vec < String > , longer_than : Duration ) -> Filter {
Filter { depth , allowed , longer_than }
2019-04-02 14:52:04 +00:00
}
}
2019-03-27 15:09:51 +00:00
struct ProfileStack {
2019-03-29 12:34:05 +00:00
starts : Vec < Instant > ,
2019-03-27 15:09:51 +00:00
messages : Vec < Message > ,
filter_data : FilterData ,
}
2019-03-29 12:34:05 +00:00
struct Message {
level : usize ,
duration : Duration ,
message : String ,
}
2019-03-27 15:09:51 +00:00
impl ProfileStack {
fn new ( ) -> ProfileStack {
ProfileStack { starts : Vec ::new ( ) , messages : Vec ::new ( ) , filter_data : Default ::default ( ) }
}
}
2019-03-29 12:34:05 +00:00
#[ derive(Default, Clone) ]
2019-03-27 15:09:51 +00:00
struct FilterData {
depth : usize ,
version : usize ,
allowed : HashSet < String > ,
2019-04-14 20:20:12 +00:00
longer_than : Duration ,
2019-03-27 15:09:51 +00:00
}
2019-04-14 19:54:57 +00:00
static PROFILING_ENABLED : AtomicBool = AtomicBool ::new ( false ) ;
2019-05-07 17:54:33 +00:00
static FILTER : Lazy < RwLock < FilterData > > = Lazy ::new ( Default ::default ) ;
2019-03-27 15:09:51 +00:00
thread_local! ( static PROFILE_STACK : RefCell < ProfileStack > = RefCell ::new ( ProfileStack ::new ( ) ) ) ;
impl Drop for Profiler {
fn drop ( & mut self ) {
2019-03-29 12:34:05 +00:00
match self {
Profiler { desc : Some ( desc ) } = > {
PROFILE_STACK . with ( | stack | {
let mut stack = stack . borrow_mut ( ) ;
let start = stack . starts . pop ( ) . unwrap ( ) ;
let duration = start . elapsed ( ) ;
let level = stack . starts . len ( ) ;
let message = mem ::replace ( desc , String ::new ( ) ) ;
stack . messages . push ( Message { level , duration , message } ) ;
if level = = 0 {
let stdout = stderr ( ) ;
2019-05-21 21:00:58 +00:00
let longer_than = stack . filter_data . longer_than ;
2020-01-02 16:21:40 +00:00
// Convert to millis for comparison to avoid problems with rounding
// (otherwise we could print `0ms` despite user's `>0` filter when
// `duration` is just a few nanos).
if duration . as_millis ( ) > longer_than . as_millis ( ) {
2020-01-19 15:07:15 +00:00
print ( & stack . messages , longer_than , & mut stdout . lock ( ) ) ;
2019-04-14 20:18:58 +00:00
}
2019-03-29 12:34:05 +00:00
stack . messages . clear ( ) ;
}
} ) ;
2019-03-27 15:09:51 +00:00
}
2019-03-29 12:34:05 +00:00
Profiler { desc : None } = > ( ) ,
}
2019-03-27 15:09:51 +00:00
}
}
2020-01-19 15:07:15 +00:00
fn print ( msgs : & [ Message ] , longer_than : Duration , out : & mut impl Write ) {
2020-01-11 18:09:31 +00:00
if msgs . is_empty ( ) {
return ;
}
2020-01-19 15:07:15 +00:00
let children_map = idx_to_children ( msgs ) ;
let root_idx = msgs . len ( ) - 1 ;
print_for_idx ( root_idx , & children_map , msgs , longer_than , out ) ;
}
fn print_for_idx (
current_idx : usize ,
children_map : & [ Vec < usize > ] ,
msgs : & [ Message ] ,
longer_than : Duration ,
out : & mut impl Write ,
) {
let current = & msgs [ current_idx ] ;
let current_indent = " " . repeat ( current . level ) ;
writeln! ( out , " {}{:5}ms - {} " , current_indent , current . duration . as_millis ( ) , current . message )
. expect ( " printing profiling info " ) ;
let longer_than_millis = longer_than . as_millis ( ) ;
let children_indices = & children_map [ current_idx ] ;
2019-10-24 06:05:11 +00:00
let mut accounted_for = Duration ::default ( ) ;
2020-01-19 15:07:15 +00:00
let mut short_children = BTreeMap ::new ( ) ; // Use `BTreeMap` to get deterministic output.
2019-05-21 13:24:53 +00:00
2020-01-19 15:07:15 +00:00
for child_idx in children_indices . iter ( ) {
let child = & msgs [ * child_idx ] ;
if child . duration . as_millis ( ) > longer_than_millis {
print_for_idx ( * child_idx , children_map , msgs , longer_than , out ) ;
2019-05-21 21:00:58 +00:00
} else {
2020-01-19 15:07:15 +00:00
let pair = short_children . entry ( & child . message ) . or_insert ( ( Duration ::default ( ) , 0 ) ) ;
pair . 0 + = child . duration ;
pair . 1 + = 1 ;
2019-05-21 21:00:58 +00:00
}
2020-01-19 15:07:15 +00:00
accounted_for + = child . duration ;
}
2019-03-29 12:34:05 +00:00
2020-01-19 15:07:15 +00:00
for ( child_msg , ( duration , count ) ) in short_children . iter ( ) {
let millis = duration . as_millis ( ) ;
writeln! ( out , " {}{:5}ms - {} ({} calls) " , current_indent , millis , child_msg , count )
. expect ( " printing profiling info " ) ;
2019-03-27 15:09:51 +00:00
}
2020-01-19 15:07:15 +00:00
let unaccounted_millis = ( current . duration - accounted_for ) . as_millis ( ) ;
if ! children_indices . is_empty ( )
& & unaccounted_millis > 0
& & unaccounted_millis > longer_than_millis
{
writeln! ( out , " {}{:5}ms - ??? " , current_indent , unaccounted_millis )
. expect ( " printing profiling info " ) ;
2019-05-21 21:00:58 +00:00
}
2020-01-19 15:07:15 +00:00
}
2019-10-24 06:05:11 +00:00
2020-01-19 15:07:15 +00:00
/// Returns a mapping from an index in the `msgs` to the vector with the indices of its children.
///
/// This assumes that the entries in `msgs` are in the order of when the calls to `profile` finish.
/// In other words, a postorder of the call graph. In particular, the root is the last element of
/// `msgs`.
fn idx_to_children ( msgs : & [ Message ] ) -> Vec < Vec < usize > > {
// Initialize with the index of the root; `ancestors` should be never empty.
let mut ancestors = vec! [ msgs . len ( ) - 1 ] ;
let mut result : Vec < Vec < usize > > = vec! [ ] ;
result . resize_with ( msgs . len ( ) , Default ::default ) ;
for ( idx , msg ) in msgs [ .. msgs . len ( ) - 1 ] . iter ( ) . enumerate ( ) . rev ( ) {
// We need to find the parent of the current message, i.e., the last ancestor that has a
// level lower than the current message.
while msgs [ * ancestors . last ( ) . unwrap ( ) ] . level > = msg . level {
ancestors . pop ( ) ;
2019-10-24 06:05:11 +00:00
}
2020-01-19 15:07:15 +00:00
result [ * ancestors . last ( ) . unwrap ( ) ] . push ( idx ) ;
ancestors . push ( idx ) ;
}
// Note that above we visited all children from the last to the first one. Let's reverse vectors
// to get the more natural order where the first element is the first child.
for vec in result . iter_mut ( ) {
vec . reverse ( ) ;
2019-10-24 06:05:11 +00:00
}
2020-01-19 15:07:15 +00:00
result
2019-03-27 15:09:51 +00:00
}
2019-06-03 21:25:43 +00:00
/// Prints backtrace to stderr, useful for debugging.
pub fn print_backtrace ( ) {
let bt = backtrace ::Backtrace ::new ( ) ;
eprintln! ( " {:?} " , bt ) ;
}
thread_local! ( static IN_SCOPE : RefCell < bool > = RefCell ::new ( false ) ) ;
/// Allows to check if the current code is withing some dynamic scope, can be
/// useful during debugging to figure out why a function is called.
pub struct Scope {
2019-06-04 11:46:22 +00:00
prev : bool ,
2019-06-03 21:25:43 +00:00
}
impl Scope {
pub fn enter ( ) -> Scope {
2019-06-04 11:46:22 +00:00
let prev = IN_SCOPE . with ( | slot | std ::mem ::replace ( & mut * slot . borrow_mut ( ) , true ) ) ;
Scope { prev }
2019-06-03 21:25:43 +00:00
}
pub fn is_active ( ) -> bool {
IN_SCOPE . with ( | slot | * slot . borrow ( ) )
}
}
impl Drop for Scope {
fn drop ( & mut self ) {
2019-06-04 11:46:22 +00:00
IN_SCOPE . with ( | slot | * slot . borrow_mut ( ) = self . prev ) ;
2019-06-03 21:25:43 +00:00
}
}
2019-08-17 12:29:57 +00:00
/// A wrapper around google_cpu_profiler.
2019-06-26 08:11:28 +00:00
///
2019-08-17 12:29:57 +00:00
/// Usage:
/// 1. Install gpref_tools (https://github.com/gperftools/gperftools), probably packaged with your Linux distro.
/// 2. Build with `cpu_profiler` feature.
/// 3. Tun the code, the *raw* output would be in the `./out.profile` file.
/// 4. Install pprof for visualization (https://github.com/google/pprof).
/// 5. Use something like `pprof -svg target/release/ra_cli ./out.profile` to see the results.
///
/// For example, here's how I run profiling on NixOS:
///
/// ```bash
/// $ nix-shell -p gperftools --run \
/// 'cargo run --release -p ra_cli -- parse < ~/projects/rustbench/parser.rs > /dev/null'
/// ```
2019-06-26 08:11:28 +00:00
#[ derive(Debug) ]
pub struct CpuProfiler {
_private : ( ) ,
}
pub fn cpu_profiler ( ) -> CpuProfiler {
2019-08-17 12:29:57 +00:00
#[ cfg(feature = " cpu_profiler " ) ]
2019-06-26 08:11:28 +00:00
{
2019-08-17 12:29:57 +00:00
google_cpu_profiler ::start ( " ./out.profile " . as_ref ( ) )
2019-06-26 08:11:28 +00:00
}
2019-08-17 12:29:57 +00:00
#[ cfg(not(feature = " cpu_profiler " )) ]
2019-06-26 08:11:28 +00:00
{
2019-08-17 12:29:57 +00:00
eprintln! ( " cpu_profiler feature is disabled " )
2019-06-26 08:11:28 +00:00
}
CpuProfiler { _private : ( ) }
}
impl Drop for CpuProfiler {
fn drop ( & mut self ) {
2019-08-17 12:29:57 +00:00
#[ cfg(feature = " cpu_profiler " ) ]
2019-06-26 08:11:28 +00:00
{
2019-08-17 12:29:57 +00:00
google_cpu_profiler ::stop ( )
2019-06-26 08:11:28 +00:00
}
}
}
2019-06-30 10:30:17 +00:00
pub fn memory_usage ( ) -> MemoryUsage {
MemoryUsage ::current ( )
}
2019-03-27 15:09:51 +00:00
#[ cfg(test) ]
mod tests {
2019-04-14 22:03:11 +00:00
use super ::* ;
2019-03-27 15:09:51 +00:00
#[ test ]
fn test_basic_profile ( ) {
let s = vec! [ " profile1 " . to_string ( ) , " profile2 " . to_string ( ) ] ;
2019-04-14 22:03:11 +00:00
let f = Filter ::new ( 2 , s , Duration ::new ( 0 , 0 ) ) ;
2019-03-27 15:09:51 +00:00
set_filter ( f ) ;
profiling_function1 ( ) ;
}
fn profiling_function1 ( ) {
let _p = profile ( " profile1 " ) ;
profiling_function2 ( ) ;
}
fn profiling_function2 ( ) {
let _p = profile ( " profile2 " ) ;
}
2020-01-02 16:21:40 +00:00
#[ test ]
fn test_longer_than ( ) {
let mut result = vec! [ ] ;
let msgs = vec! [
Message { level : 1 , duration : Duration ::from_nanos ( 3 ) , message : " bar " . to_owned ( ) } ,
Message { level : 1 , duration : Duration ::from_nanos ( 2 ) , message : " bar " . to_owned ( ) } ,
Message { level : 0 , duration : Duration ::from_millis ( 1 ) , message : " foo " . to_owned ( ) } ,
] ;
2020-01-19 15:07:15 +00:00
print ( & msgs , Duration ::from_millis ( 0 ) , & mut result ) ;
2020-01-02 16:21:40 +00:00
// The calls to `bar` are so short that they'll be rounded to 0ms and should get collapsed
// when printing.
assert_eq! (
std ::str ::from_utf8 ( & result ) . unwrap ( ) ,
" 1ms - foo \n 0ms - bar (2 calls) \n "
) ;
}
2020-01-11 18:09:31 +00:00
#[ test ]
fn test_unaccounted_for_topmost ( ) {
let mut result = vec! [ ] ;
let msgs = vec! [
Message { level : 1 , duration : Duration ::from_millis ( 2 ) , message : " bar " . to_owned ( ) } ,
Message { level : 0 , duration : Duration ::from_millis ( 5 ) , message : " foo " . to_owned ( ) } ,
] ;
2020-01-19 15:07:15 +00:00
print ( & msgs , Duration ::from_millis ( 0 ) , & mut result ) ;
2020-01-11 18:09:31 +00:00
assert_eq! (
std ::str ::from_utf8 ( & result ) . unwrap ( ) . lines ( ) . collect ::< Vec < _ > > ( ) ,
vec! [
" 5ms - foo " ,
" 2ms - bar " ,
" 3ms - ??? " ,
// Dummy comment to improve formatting
]
) ;
}
#[ test ]
fn test_unaccounted_for_multiple_levels ( ) {
let mut result = vec! [ ] ;
let msgs = vec! [
Message { level : 2 , duration : Duration ::from_millis ( 3 ) , message : " baz " . to_owned ( ) } ,
Message { level : 1 , duration : Duration ::from_millis ( 5 ) , message : " bar " . to_owned ( ) } ,
Message { level : 2 , duration : Duration ::from_millis ( 2 ) , message : " baz " . to_owned ( ) } ,
Message { level : 1 , duration : Duration ::from_millis ( 4 ) , message : " bar " . to_owned ( ) } ,
Message { level : 0 , duration : Duration ::from_millis ( 9 ) , message : " foo " . to_owned ( ) } ,
] ;
2020-01-19 15:07:15 +00:00
print ( & msgs , Duration ::from_millis ( 0 ) , & mut result ) ;
2020-01-11 18:09:31 +00:00
assert_eq! (
std ::str ::from_utf8 ( & result ) . unwrap ( ) . lines ( ) . collect ::< Vec < _ > > ( ) ,
vec! [
" 9ms - foo " ,
" 5ms - bar " ,
" 3ms - baz " ,
" 2ms - ??? " ,
" 4ms - bar " ,
" 2ms - baz " ,
" 2ms - ??? " ,
]
) ;
}
2019-03-27 15:09:51 +00:00
}