forked from tokio-rs/tracing
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
opentelemetry: support publishing metrics (tokio-rs#2185)
Motivation: Currently, there is no way to publish metrics via tracing. Solution: Update the tracing-opentelemetry crate to publish metrics for event fields that contain specific prefixes in the name. Right now, we lazily instantiate and store one metrics object per-callsite, but a future improvement that we should add to tracing itself is the ability to store data per-callsite, so that we don't have to do a HashMap lookup each time we want to publish a metric. Co-authored-by: Eliza Weisman <[email protected]> Co-authored-by: David Barsky <[email protected]>
- Loading branch information
Showing
4 changed files
with
644 additions
and
1 deletion.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,352 @@ | ||
use std::{collections::HashMap, fmt, sync::RwLock}; | ||
use tracing::{field::Visit, Subscriber}; | ||
use tracing_core::Field; | ||
|
||
use opentelemetry::{ | ||
metrics::{Counter, Meter, MeterProvider, UpDownCounter, ValueRecorder}, | ||
sdk::metrics::PushController, | ||
}; | ||
use tracing_subscriber::{layer::Context, registry::LookupSpan, Layer}; | ||
|
||
const CARGO_PKG_VERSION: &str = env!("CARGO_PKG_VERSION"); | ||
const INSTRUMENTATION_LIBRARY_NAME: &str = "tracing/tracing-opentelemetry"; | ||
|
||
const METRIC_PREFIX_MONOTONIC_COUNTER: &str = "monotonic_counter."; | ||
const METRIC_PREFIX_COUNTER: &str = "counter."; | ||
const METRIC_PREFIX_VALUE: &str = "value."; | ||
const I64_MAX: u64 = i64::MAX as u64; | ||
|
||
#[derive(Default)] | ||
pub(crate) struct Instruments { | ||
u64_counter: MetricsMap<Counter<u64>>, | ||
f64_counter: MetricsMap<Counter<f64>>, | ||
i64_up_down_counter: MetricsMap<UpDownCounter<i64>>, | ||
f64_up_down_counter: MetricsMap<UpDownCounter<f64>>, | ||
u64_value_recorder: MetricsMap<ValueRecorder<u64>>, | ||
i64_value_recorder: MetricsMap<ValueRecorder<i64>>, | ||
f64_value_recorder: MetricsMap<ValueRecorder<f64>>, | ||
} | ||
|
||
type MetricsMap<T> = RwLock<HashMap<&'static str, T>>; | ||
|
||
#[derive(Copy, Clone, Debug)] | ||
pub(crate) enum InstrumentType { | ||
CounterU64(u64), | ||
CounterF64(f64), | ||
UpDownCounterI64(i64), | ||
UpDownCounterF64(f64), | ||
ValueRecorderU64(u64), | ||
ValueRecorderI64(i64), | ||
ValueRecorderF64(f64), | ||
} | ||
|
||
impl Instruments { | ||
pub(crate) fn update_metric( | ||
&self, | ||
meter: &Meter, | ||
instrument_type: InstrumentType, | ||
metric_name: &'static str, | ||
) { | ||
fn update_or_insert<T>( | ||
map: &MetricsMap<T>, | ||
name: &'static str, | ||
insert: impl FnOnce() -> T, | ||
update: impl FnOnce(&T), | ||
) { | ||
{ | ||
let lock = map.read().unwrap(); | ||
if let Some(metric) = lock.get(name) { | ||
update(metric); | ||
return; | ||
} | ||
} | ||
|
||
// that metric did not already exist, so we have to acquire a write lock to | ||
// create it. | ||
let mut lock = map.write().unwrap(); | ||
// handle the case where the entry was created while we were waiting to | ||
// acquire the write lock | ||
let metric = lock.entry(name).or_insert_with(insert); | ||
update(metric) | ||
} | ||
|
||
match instrument_type { | ||
InstrumentType::CounterU64(value) => { | ||
update_or_insert( | ||
&self.u64_counter, | ||
metric_name, | ||
|| meter.u64_counter(metric_name).init(), | ||
|ctr| ctr.add(value, &[]), | ||
); | ||
} | ||
InstrumentType::CounterF64(value) => { | ||
update_or_insert( | ||
&self.f64_counter, | ||
metric_name, | ||
|| meter.f64_counter(metric_name).init(), | ||
|ctr| ctr.add(value, &[]), | ||
); | ||
} | ||
InstrumentType::UpDownCounterI64(value) => { | ||
update_or_insert( | ||
&self.i64_up_down_counter, | ||
metric_name, | ||
|| meter.i64_up_down_counter(metric_name).init(), | ||
|ctr| ctr.add(value, &[]), | ||
); | ||
} | ||
InstrumentType::UpDownCounterF64(value) => { | ||
update_or_insert( | ||
&self.f64_up_down_counter, | ||
metric_name, | ||
|| meter.f64_up_down_counter(metric_name).init(), | ||
|ctr| ctr.add(value, &[]), | ||
); | ||
} | ||
InstrumentType::ValueRecorderU64(value) => { | ||
update_or_insert( | ||
&self.u64_value_recorder, | ||
metric_name, | ||
|| meter.u64_value_recorder(metric_name).init(), | ||
|rec| rec.record(value, &[]), | ||
); | ||
} | ||
InstrumentType::ValueRecorderI64(value) => { | ||
update_or_insert( | ||
&self.i64_value_recorder, | ||
metric_name, | ||
|| meter.i64_value_recorder(metric_name).init(), | ||
|rec| rec.record(value, &[]), | ||
); | ||
} | ||
InstrumentType::ValueRecorderF64(value) => { | ||
update_or_insert( | ||
&self.f64_value_recorder, | ||
metric_name, | ||
|| meter.f64_value_recorder(metric_name).init(), | ||
|rec| rec.record(value, &[]), | ||
); | ||
} | ||
}; | ||
} | ||
} | ||
|
||
pub(crate) struct MetricVisitor<'a> { | ||
pub(crate) instruments: &'a Instruments, | ||
pub(crate) meter: &'a Meter, | ||
} | ||
|
||
impl<'a> Visit for MetricVisitor<'a> { | ||
fn record_debug(&mut self, _field: &Field, _value: &dyn fmt::Debug) { | ||
// Do nothing | ||
} | ||
|
||
fn record_u64(&mut self, field: &Field, value: u64) { | ||
if let Some(metric_name) = field.name().strip_prefix(METRIC_PREFIX_MONOTONIC_COUNTER) { | ||
self.instruments.update_metric( | ||
self.meter, | ||
InstrumentType::CounterU64(value), | ||
metric_name, | ||
); | ||
} else if let Some(metric_name) = field.name().strip_prefix(METRIC_PREFIX_COUNTER) { | ||
if value <= I64_MAX { | ||
self.instruments.update_metric( | ||
self.meter, | ||
InstrumentType::UpDownCounterI64(value as i64), | ||
metric_name, | ||
); | ||
} else { | ||
eprintln!( | ||
"[tracing-opentelemetry]: Received Counter metric, but \ | ||
provided u64: {} is greater than i64::MAX. Ignoring \ | ||
this metric.", | ||
value | ||
); | ||
} | ||
} else if let Some(metric_name) = field.name().strip_prefix(METRIC_PREFIX_VALUE) { | ||
self.instruments.update_metric( | ||
self.meter, | ||
InstrumentType::ValueRecorderU64(value), | ||
metric_name, | ||
); | ||
} | ||
} | ||
|
||
fn record_f64(&mut self, field: &Field, value: f64) { | ||
if let Some(metric_name) = field.name().strip_prefix(METRIC_PREFIX_MONOTONIC_COUNTER) { | ||
self.instruments.update_metric( | ||
self.meter, | ||
InstrumentType::CounterF64(value), | ||
metric_name, | ||
); | ||
} else if let Some(metric_name) = field.name().strip_prefix(METRIC_PREFIX_COUNTER) { | ||
self.instruments.update_metric( | ||
self.meter, | ||
InstrumentType::UpDownCounterF64(value), | ||
metric_name, | ||
); | ||
} else if let Some(metric_name) = field.name().strip_prefix(METRIC_PREFIX_VALUE) { | ||
self.instruments.update_metric( | ||
self.meter, | ||
InstrumentType::ValueRecorderF64(value), | ||
metric_name, | ||
); | ||
} | ||
} | ||
|
||
fn record_i64(&mut self, field: &Field, value: i64) { | ||
if let Some(metric_name) = field.name().strip_prefix(METRIC_PREFIX_MONOTONIC_COUNTER) { | ||
self.instruments.update_metric( | ||
self.meter, | ||
InstrumentType::CounterU64(value as u64), | ||
metric_name, | ||
); | ||
} else if let Some(metric_name) = field.name().strip_prefix(METRIC_PREFIX_COUNTER) { | ||
self.instruments.update_metric( | ||
self.meter, | ||
InstrumentType::UpDownCounterI64(value), | ||
metric_name, | ||
); | ||
} else if let Some(metric_name) = field.name().strip_prefix(METRIC_PREFIX_VALUE) { | ||
self.instruments.update_metric( | ||
self.meter, | ||
InstrumentType::ValueRecorderI64(value), | ||
metric_name, | ||
); | ||
} | ||
} | ||
} | ||
|
||
/// A layer that publishes metrics via the OpenTelemetry SDK. | ||
/// | ||
/// # Usage | ||
/// | ||
/// No configuration is needed for this Layer, as it's only responsible for | ||
/// pushing data out to the `opentelemetry` family of crates. For example, when | ||
/// using `opentelemetry-otlp`, that crate will provide its own set of | ||
/// configuration options for setting up the duration metrics will be collected | ||
/// before exporting to the OpenTelemetry Collector, aggregation of data points, | ||
/// etc. | ||
/// | ||
/// ```no_run | ||
/// use tracing_opentelemetry::MetricsLayer; | ||
/// use tracing_subscriber::layer::SubscriberExt; | ||
/// use tracing_subscriber::Registry; | ||
/// # use opentelemetry::sdk::metrics::PushController; | ||
/// | ||
/// // Constructing a PushController is out-of-scope for the docs here, but there | ||
/// // are examples in the opentelemetry repository. See: | ||
/// // https://github.com/open-telemetry/opentelemetry-rust/blob/c13a11e62a68eacd8c41a0742a0d097808e28fbd/examples/basic-otlp/src/main.rs#L39-L53 | ||
/// # let push_controller: PushController = unimplemented!(); | ||
/// | ||
/// let opentelemetry_metrics = MetricsLayer::new(push_controller); | ||
/// let subscriber = Registry::default().with(opentelemetry_metrics); | ||
/// tracing::subscriber::set_global_default(subscriber).unwrap(); | ||
/// ``` | ||
/// | ||
/// To publish a new metric, add a key-value pair to your `tracing::Event` that | ||
/// contains following prefixes: | ||
/// - `monotonic_counter.` (non-negative numbers): Used when the counter should | ||
/// only ever increase | ||
/// - `counter.`: Used when the counter can go up or down | ||
/// - `value.`: Used for discrete data points (i.e., summing them does not make | ||
/// semantic sense) | ||
/// | ||
/// Examples: | ||
/// ``` | ||
/// # use tracing::info; | ||
/// info!(monotonic_counter.foo = 1); | ||
/// info!(monotonic_counter.bar = 1.1); | ||
/// | ||
/// info!(counter.baz = 1); | ||
/// info!(counter.baz = -1); | ||
/// info!(counter.xyz = 1.1); | ||
/// | ||
/// info!(value.qux = 1); | ||
/// info!(value.abc = -1); | ||
/// info!(value.def = 1.1); | ||
/// ``` | ||
/// | ||
/// # Mixing data types | ||
/// | ||
/// ## Floating-point numbers | ||
/// | ||
/// Do not mix floating point and non-floating point numbers for the same | ||
/// metric. If a floating point number will be used for a given metric, be sure | ||
/// to cast any other usages of that metric to a floating point number. | ||
/// | ||
/// Do this: | ||
/// ``` | ||
/// # use tracing::info; | ||
/// info!(monotonic_counter.foo = 1_f64); | ||
/// info!(monotonic_counter.foo = 1.1); | ||
/// ``` | ||
/// | ||
/// This is because all data published for a given metric name must be the same | ||
/// numeric type. | ||
/// | ||
/// ## Integers | ||
/// | ||
/// Positive and negative integers can be mixed freely. The instrumentation | ||
/// provided by `tracing` assumes that all integers are `i64` unless explicitly | ||
/// cast to something else. In the case that an integer *is* cast to `u64`, this | ||
/// subscriber will handle the conversion internally. | ||
/// | ||
/// For example: | ||
/// ``` | ||
/// # use tracing::info; | ||
/// // The subscriber receives an i64 | ||
/// info!(counter.baz = 1); | ||
/// | ||
/// // The subscriber receives an i64 | ||
/// info!(counter.baz = -1); | ||
/// | ||
/// // The subscriber receives a u64, but casts it to i64 internally | ||
/// info!(counter.baz = 1_u64); | ||
/// | ||
/// // The subscriber receives a u64, but cannot cast it to i64 because of | ||
/// // overflow. An error is printed to stderr, and the metric is dropped. | ||
/// info!(counter.baz = (i64::MAX as u64) + 1) | ||
/// ``` | ||
/// | ||
/// # Implementation Details | ||
/// | ||
/// `MetricsLayer` holds a set of maps, with each map corresponding to a | ||
/// type of metric supported by OpenTelemetry. These maps are populated lazily. | ||
/// The first time that a metric is emitted by the instrumentation, a `Metric` | ||
/// instance will be created and added to the corresponding map. This means that | ||
/// any time a metric is emitted by the instrumentation, one map lookup has to | ||
/// be performed. | ||
/// | ||
/// In the future, this can be improved by associating each `Metric` instance to | ||
/// its callsite, eliminating the need for any maps. | ||
pub struct MetricsLayer { | ||
meter: Meter, | ||
instruments: Instruments, | ||
} | ||
|
||
impl MetricsLayer { | ||
/// Create a new instance of MetricsLayer. | ||
pub fn new(push_controller: PushController) -> Self { | ||
let meter = push_controller | ||
.provider() | ||
.meter(INSTRUMENTATION_LIBRARY_NAME, Some(CARGO_PKG_VERSION)); | ||
MetricsLayer { | ||
meter, | ||
instruments: Default::default(), | ||
} | ||
} | ||
} | ||
|
||
impl<S> Layer<S> for MetricsLayer | ||
where | ||
S: Subscriber + for<'span> LookupSpan<'span>, | ||
{ | ||
fn on_event(&self, event: &tracing::Event<'_>, _ctx: Context<'_, S>) { | ||
let mut metric_visitor = MetricVisitor { | ||
instruments: &self.instruments, | ||
meter: &self.meter, | ||
}; | ||
event.record(&mut metric_visitor); | ||
} | ||
} |
Oops, something went wrong.