Skip to content

Commit 75d3d84

Browse files
bors[bot]matklad
andauthored
Merge #4144
4144: Refactor hierarchical profiling r=matklad a=matklad bors r+ 🤖 Co-authored-by: Aleksey Kladov <[email protected]>
2 parents 5671bac + 0202087 commit 75d3d84

File tree

8 files changed

+344
-397
lines changed

8 files changed

+344
-397
lines changed

Cargo.lock

+1
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

crates/ra_arena/src/lib.rs

+3
Original file line numberDiff line numberDiff line change
@@ -96,6 +96,9 @@ impl<T> Arena<T> {
9696
pub const fn new() -> Arena<T> {
9797
Arena { data: Vec::new() }
9898
}
99+
pub fn clear(&mut self) {
100+
self.data.clear();
101+
}
99102

100103
pub fn len(&self) -> usize {
101104
self.data.len()

crates/ra_hir_ty/src/infer.rs

+1-2
Original file line numberDiff line numberDiff line change
@@ -686,10 +686,9 @@ mod diagnostics {
686686
) {
687687
match self {
688688
InferenceDiagnostic::NoSuchField { expr, field } => {
689-
let source = owner.lookup(db.upcast()).source(db.upcast());
690689
let (_, source_map) = db.body_with_source_map(owner.into());
691690
let field = source_map.field_syntax(*expr, *field);
692-
sink.push(NoSuchField { file: source.file_id, field: field.value })
691+
sink.push(NoSuchField { file: field.file_id, field: field.value })
693692
}
694693
}
695694
}

crates/ra_prof/Cargo.toml

+1
Original file line numberDiff line numberDiff line change
@@ -9,6 +9,7 @@ publish = false
99
doctest = false
1010

1111
[dependencies]
12+
ra_arena = { path = "../ra_arena" }
1213
once_cell = "1.3.1"
1314
backtrace = { version = "0.3.44", optional = true }
1415

crates/ra_prof/src/hprof.rs

+246
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,246 @@
1+
//! Simple hierarchical profiler
2+
use once_cell::sync::Lazy;
3+
use std::{
4+
cell::RefCell,
5+
collections::{BTreeMap, HashSet},
6+
io::{stderr, Write},
7+
sync::{
8+
atomic::{AtomicBool, Ordering},
9+
RwLock,
10+
},
11+
time::{Duration, Instant},
12+
};
13+
14+
use crate::tree::{Idx, Tree};
15+
16+
/// Filtering syntax
17+
/// env RA_PROFILE=* // dump everything
18+
/// env RA_PROFILE=foo|bar|baz // enabled only selected entries
19+
/// env RA_PROFILE=*@3>10 // dump everything, up to depth 3, if it takes more than 10 ms
20+
pub fn init() {
21+
let spec = std::env::var("RA_PROFILE").unwrap_or_default();
22+
init_from(&spec);
23+
}
24+
25+
pub fn init_from(spec: &str) {
26+
let filter = if spec.is_empty() { Filter::disabled() } else { Filter::from_spec(spec) };
27+
filter.install();
28+
}
29+
30+
pub type Label = &'static str;
31+
32+
/// This function starts a profiling scope in the current execution stack with a given description.
33+
/// It returns a Profile structure and measure elapsed time between this method invocation and Profile structure drop.
34+
/// It supports nested profiling scopes in case when this function invoked multiple times at the execution stack. In this case the profiling information will be nested at the output.
35+
/// Profiling information is being printed in the stderr.
36+
///
37+
/// # Example
38+
/// ```
39+
/// use ra_prof::{profile, set_filter, Filter};
40+
///
41+
/// let f = Filter::from_spec("profile1|profile2@2");
42+
/// set_filter(f);
43+
/// profiling_function1();
44+
///
45+
/// fn profiling_function1() {
46+
/// let _p = profile("profile1");
47+
/// profiling_function2();
48+
/// }
49+
///
50+
/// fn profiling_function2() {
51+
/// let _p = profile("profile2");
52+
/// }
53+
/// ```
54+
/// This will print in the stderr the following:
55+
/// ```text
56+
/// 0ms - profile
57+
/// 0ms - profile2
58+
/// ```
59+
pub fn profile(label: Label) -> Profiler {
60+
assert!(!label.is_empty());
61+
let enabled = PROFILING_ENABLED.load(Ordering::Relaxed)
62+
&& PROFILE_STACK.with(|stack| stack.borrow_mut().push(label));
63+
let label = if enabled { Some(label) } else { None };
64+
Profiler { label, detail: None }
65+
}
66+
67+
pub struct Profiler {
68+
label: Option<Label>,
69+
detail: Option<String>,
70+
}
71+
72+
impl Profiler {
73+
pub fn detail(mut self, detail: impl FnOnce() -> String) -> Profiler {
74+
if self.label.is_some() {
75+
self.detail = Some(detail())
76+
}
77+
self
78+
}
79+
}
80+
81+
impl Drop for Profiler {
82+
fn drop(&mut self) {
83+
match self {
84+
Profiler { label: Some(label), detail } => {
85+
PROFILE_STACK.with(|stack| {
86+
stack.borrow_mut().pop(label, detail.take());
87+
});
88+
}
89+
Profiler { label: None, .. } => (),
90+
}
91+
}
92+
}
93+
94+
static PROFILING_ENABLED: AtomicBool = AtomicBool::new(false);
95+
static FILTER: Lazy<RwLock<Filter>> = Lazy::new(Default::default);
96+
thread_local!(static PROFILE_STACK: RefCell<ProfileStack> = RefCell::new(ProfileStack::new()));
97+
98+
#[derive(Default, Clone, Debug)]
99+
struct Filter {
100+
depth: usize,
101+
allowed: HashSet<String>,
102+
longer_than: Duration,
103+
version: usize,
104+
}
105+
106+
impl Filter {
107+
fn disabled() -> Filter {
108+
Filter::default()
109+
}
110+
111+
fn from_spec(mut spec: &str) -> Filter {
112+
let longer_than = if let Some(idx) = spec.rfind('>') {
113+
let longer_than = spec[idx + 1..].parse().expect("invalid profile longer_than");
114+
spec = &spec[..idx];
115+
Duration::from_millis(longer_than)
116+
} else {
117+
Duration::new(0, 0)
118+
};
119+
120+
let depth = if let Some(idx) = spec.rfind('@') {
121+
let depth: usize = spec[idx + 1..].parse().expect("invalid profile depth");
122+
spec = &spec[..idx];
123+
depth
124+
} else {
125+
999
126+
};
127+
let allowed =
128+
if spec == "*" { HashSet::new() } else { spec.split('|').map(String::from).collect() };
129+
Filter { depth, allowed, longer_than, version: 0 }
130+
}
131+
132+
fn install(mut self) {
133+
PROFILING_ENABLED.store(self.depth > 0, Ordering::SeqCst);
134+
let mut old = FILTER.write().unwrap();
135+
self.version = old.version + 1;
136+
*old = self;
137+
}
138+
}
139+
140+
struct ProfileStack {
141+
starts: Vec<Instant>,
142+
filter: Filter,
143+
messages: Tree<Message>,
144+
}
145+
146+
#[derive(Default)]
147+
struct Message {
148+
duration: Duration,
149+
label: Label,
150+
detail: Option<String>,
151+
}
152+
153+
impl ProfileStack {
154+
fn new() -> ProfileStack {
155+
ProfileStack { starts: Vec::new(), messages: Tree::default(), filter: Default::default() }
156+
}
157+
158+
fn push(&mut self, label: Label) -> bool {
159+
if self.starts.is_empty() {
160+
if let Ok(f) = FILTER.try_read() {
161+
if f.version > self.filter.version {
162+
self.filter = f.clone();
163+
}
164+
};
165+
}
166+
if self.starts.len() > self.filter.depth {
167+
return false;
168+
}
169+
let allowed = &self.filter.allowed;
170+
if self.starts.is_empty() && !allowed.is_empty() && !allowed.contains(label) {
171+
return false;
172+
}
173+
174+
self.starts.push(Instant::now());
175+
self.messages.start();
176+
true
177+
}
178+
179+
pub fn pop(&mut self, label: Label, detail: Option<String>) {
180+
let start = self.starts.pop().unwrap();
181+
let duration = start.elapsed();
182+
let level = self.starts.len();
183+
self.messages.finish(Message { duration, label, detail });
184+
if level == 0 {
185+
let longer_than = self.filter.longer_than;
186+
// Convert to millis for comparison to avoid problems with rounding
187+
// (otherwise we could print `0ms` despite user's `>0` filter when
188+
// `duration` is just a few nanos).
189+
if duration.as_millis() > longer_than.as_millis() {
190+
let stderr = stderr();
191+
if let Some(root) = self.messages.root() {
192+
print(&self.messages, root, 0, longer_than, &mut stderr.lock());
193+
}
194+
}
195+
self.messages.clear();
196+
assert!(self.starts.is_empty())
197+
}
198+
}
199+
}
200+
201+
fn print(
202+
tree: &Tree<Message>,
203+
curr: Idx<Message>,
204+
level: u32,
205+
longer_than: Duration,
206+
out: &mut impl Write,
207+
) {
208+
let current_indent = " ".repeat(level as usize);
209+
let detail = tree[curr].detail.as_ref().map(|it| format!(" @ {}", it)).unwrap_or_default();
210+
writeln!(
211+
out,
212+
"{}{:5}ms - {}{}",
213+
current_indent,
214+
tree[curr].duration.as_millis(),
215+
tree[curr].label,
216+
detail,
217+
)
218+
.expect("printing profiling info");
219+
220+
let mut accounted_for = Duration::default();
221+
let mut short_children = BTreeMap::new(); // Use `BTreeMap` to get deterministic output.
222+
for child in tree.children(curr) {
223+
accounted_for += tree[child].duration;
224+
225+
if tree[child].duration.as_millis() > longer_than.as_millis() {
226+
print(tree, child, level + 1, longer_than, out)
227+
} else {
228+
let (total_duration, cnt) =
229+
short_children.entry(tree[child].label).or_insert((Duration::default(), 0));
230+
*total_duration += tree[child].duration;
231+
*cnt += 1;
232+
}
233+
}
234+
235+
for (child_msg, (duration, count)) in short_children.iter() {
236+
let millis = duration.as_millis();
237+
writeln!(out, " {}{:5}ms - {} ({} calls)", current_indent, millis, child_msg, count)
238+
.expect("printing profiling info");
239+
}
240+
241+
let unaccounted = tree[curr].duration - accounted_for;
242+
if tree.children(curr).next().is_some() && unaccounted > longer_than {
243+
writeln!(out, " {}{:5}ms - ???", current_indent, unaccounted.as_millis())
244+
.expect("printing profiling info");
245+
}
246+
}

0 commit comments

Comments
 (0)