-
Notifications
You must be signed in to change notification settings - Fork 493
fix(tracing): honor OTEL resource env config #7061
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
base: main
Are you sure you want to change the base?
Changes from all commits
7012fe7
c452c4e
60e65ad
0b4c16b
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -1,12 +1,14 @@ | ||
| use std::time::Duration; | ||
|
|
||
| use opentelemetry::Key; | ||
| // These match the OTEL_EXPORTER_OTLP_* environment variables from: | ||
| // https://opentelemetry.io/docs/languages/sdk-configuration/otlp-exporter/#endpoint-configuration | ||
| use opentelemetry_otlp::{ | ||
| OTEL_EXPORTER_OTLP_ENDPOINT, OTEL_EXPORTER_OTLP_LOGS_ENDPOINT, | ||
| OTEL_EXPORTER_OTLP_METRICS_ENDPOINT, OTEL_EXPORTER_OTLP_PROTOCOL, | ||
| OTEL_EXPORTER_OTLP_TRACES_ENDPOINT, Protocol, | ||
| }; | ||
| use opentelemetry_sdk::Resource; | ||
|
|
||
| /// Environment variable for the general OTLP endpoint. | ||
| pub const ENV_OLD_OTLP_ENDPOINT: &str = "DAFT_DEV_OTEL_EXPORTER_OTLP_ENDPOINT"; | ||
|
|
@@ -107,4 +109,123 @@ impl Config { | |
| .map(Duration::from_millis) | ||
| .unwrap_or(Duration::from_millis(500)) | ||
| } | ||
|
|
||
| pub fn resource(&self) -> Resource { | ||
| let detected_resource = Resource::builder().build(); | ||
| let service_name = std::env::var("OTEL_SERVICE_NAME") | ||
| .ok() | ||
| .filter(|name| !name.is_empty()) | ||
| .or_else(|| { | ||
| detected_resource | ||
| .get(&Key::new("service.name")) | ||
| .map(|value| value.to_string()) | ||
| .filter(|name| name != "unknown_service") | ||
| }) | ||
| .unwrap_or_else(|| "daft".to_string()); | ||
|
|
||
| Resource::builder().with_service_name(service_name).build() | ||
| } | ||
| } | ||
|
|
||
| #[cfg(test)] | ||
| mod tests { | ||
| use std::sync::Mutex; | ||
|
|
||
| use opentelemetry::{Key, Value}; | ||
|
|
||
| use super::*; | ||
|
|
||
| static ENV_LOCK: Mutex<()> = Mutex::new(()); | ||
|
|
||
| fn with_env_vars<R>(vars: &[(&str, Option<&str>)], f: impl FnOnce() -> R) -> R { | ||
| let _guard = ENV_LOCK.lock().unwrap(); | ||
| let previous_values: Vec<_> = vars | ||
| .iter() | ||
| .map(|(name, _)| (*name, std::env::var(name).ok())) | ||
| .collect(); | ||
|
|
||
| for (name, value) in vars { | ||
| match value { | ||
| Some(value) => unsafe { std::env::set_var(name, value) }, | ||
| None => unsafe { std::env::remove_var(name) }, | ||
| } | ||
| } | ||
|
|
||
| let result = f(); | ||
|
|
||
| for (name, value) in previous_values { | ||
| match value { | ||
| Some(value) => unsafe { std::env::set_var(name, value) }, | ||
| None => unsafe { std::env::remove_var(name) }, | ||
| } | ||
| } | ||
|
|
||
| result | ||
| } | ||
|
Comment on lines
+140
to
+164
Contributor
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more.
If the closure |
||
|
|
||
| #[test] | ||
| fn resource_defaults_to_daft_service_name() { | ||
| with_env_vars( | ||
| &[ | ||
| ("OTEL_SERVICE_NAME", None), | ||
| ("OTEL_RESOURCE_ATTRIBUTES", None), | ||
| ], | ||
| || { | ||
| let resource = Config::from_env().resource(); | ||
| assert_eq!( | ||
| resource.get(&Key::new("service.name")), | ||
| Some(Value::from("daft")) | ||
| ); | ||
| }, | ||
| ); | ||
| } | ||
|
|
||
| #[test] | ||
| fn resource_uses_otel_service_name_env() { | ||
| with_env_vars( | ||
| &[ | ||
| ("OTEL_SERVICE_NAME", Some("daft-ray-worker")), | ||
| ("OTEL_RESOURCE_ATTRIBUTES", None), | ||
| ], | ||
| || { | ||
| let resource = Config::from_env().resource(); | ||
| assert_eq!( | ||
| resource.get(&Key::new("service.name")), | ||
| Some(Value::from("daft-ray-worker")) | ||
| ); | ||
| }, | ||
| ); | ||
| } | ||
|
|
||
| #[test] | ||
| fn resource_includes_otel_resource_attributes() { | ||
| with_env_vars( | ||
| &[ | ||
| ("OTEL_SERVICE_NAME", None), | ||
| ( | ||
| "OTEL_RESOURCE_ATTRIBUTES", | ||
| Some("deployment.environment=staging,service.version=0.7.14"), | ||
| ), | ||
| ], | ||
| || { | ||
| let resource = Config::from_env().resource(); | ||
| assert_eq!( | ||
| resource.get(&Key::new("deployment.environment")), | ||
| Some(Value::from("staging")) | ||
| ); | ||
| assert_eq!( | ||
| resource.get(&Key::new("telemetry.sdk.language")), | ||
| Some(Value::from("rust")) | ||
| ); | ||
| assert_eq!( | ||
| resource.get(&Key::new("service.version")), | ||
| Some(Value::from("0.7.14")) | ||
| ); | ||
| assert_eq!( | ||
| resource.get(&Key::new("service.name")), | ||
| Some(Value::from("daft")) | ||
| ); | ||
| }, | ||
| ); | ||
| } | ||
| } | ||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -1,9 +1,6 @@ | ||
| mod config; | ||
|
|
||
| use std::{ | ||
| sync::{LazyLock, Mutex}, | ||
| time::Duration, | ||
| }; | ||
| use std::sync::{LazyLock, Mutex}; | ||
|
|
||
| use common_runtime::get_io_runtime; | ||
| pub use config::Config; | ||
|
|
@@ -53,7 +50,7 @@ impl TraceFormat { | |
|
|
||
| pub fn init_tracing() { | ||
| let config = Config::from_env(); | ||
| let resource = Resource::builder().with_service_name("daft").build(); | ||
| let resource = config.resource(); | ||
| let tracer_provider = if config.enabled() { | ||
| let runtime = get_io_runtime(true); | ||
| runtime.block_on_current_thread(async { | ||
|
|
@@ -158,7 +155,6 @@ fn init_otlp_logger_provider(config: &Config, otlp_endpoint: &str, resource: Res | |
| let log_exporter = opentelemetry_otlp::LogExporter::builder() | ||
| .with_tonic() | ||
| .with_endpoint(otlp_endpoint) | ||
| .with_timeout(Duration::from_secs(10)) | ||
| .build() | ||
| .expect("Failed to build OTLP logger exporter."); | ||
|
|
||
|
|
@@ -188,14 +184,12 @@ fn init_otlp_metrics_provider(config: &Config, endpoint: &str, resource: Resourc | |
| opentelemetry_otlp::MetricExporter::builder() | ||
| .with_tonic() | ||
| .with_endpoint(endpoint) | ||
| .with_timeout(Duration::from_secs(10)) | ||
| .build() | ||
| } | ||
| Protocol::HttpBinary => { | ||
| opentelemetry_otlp::MetricExporter::builder() | ||
| .with_http() | ||
| .with_endpoint(endpoint) | ||
| .with_timeout(Duration::from_secs(10)) | ||
| .with_protocol(config.otlp_protocol) | ||
| .build() | ||
| } | ||
|
|
@@ -242,7 +236,6 @@ fn init_otlp_tracer_provider( | |
| let exporter = opentelemetry_otlp::SpanExporter::builder() | ||
| .with_tonic() | ||
| .with_endpoint(otlp_endpoint) | ||
| .with_timeout(Duration::from_secs(10)) | ||
|
Contributor
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Since this is now being read from the env what is the default if it's not set?
Contributor
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. It looks like the defaults were already 10s: https://opentelemetry.io/docs/languages/sdk-configuration/otlp-exporter/#timeout-configuration |
||
| .build() | ||
| .expect("Failed to build OTLP span exporter for tracing"); | ||
|
|
||
|
|
||
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Is there a constant in the opentelemetry_otlp create we can use?