Skip to content

Commit 6397a93

Browse files
bors[bot]nightkr
andauthored
Merge #322
322: Helpers for reporting controller errors as K8s events r=teozkr a=teozkr ## Description Fixes #321 ## Review Checklist - [x] Code contains useful comments - [x] (Integration-)Test cases added (or not applicable) - [x] Documentation added (or not applicable) - [x] Changelog updated (or not applicable) Co-authored-by: Teo Klestrup Röijezon <[email protected]>
2 parents 020906f + 0798470 commit 6397a93

File tree

5 files changed

+244
-2
lines changed

5 files changed

+244
-2
lines changed

CHANGELOG.md

+5-1
Original file line numberDiff line numberDiff line change
@@ -4,8 +4,11 @@ All notable changes to this project will be documented in this file.
44

55
## [Unreleased]
66

7+
### Added
8+
- Infrastructure for logging errors as K8s events ([#322])
9+
710
### Changed
8-
- BREAKING: kube 0.68 -> 0.69 ([#319]).
11+
- BREAKING: kube 0.68 -> 0.69.1 ([#319, [#322]]).
912

1013
### Removed
1114
- Chrono's time 0.1 compatibility ([#310]).
@@ -14,6 +17,7 @@ All notable changes to this project will be documented in this file.
1417
[#310]: https://github.com/stackabletech/operator-rs/pull/310
1518
[#319]: https://github.com/stackabletech/operator-rs/pull/319
1619
[#320]: https://github.com/stackabletech/operator-rs/pull/320
20+
[#322]: https://github.com/stackabletech/operator-rs/pull/322
1721

1822
## [0.10.0] - 2022-02-04
1923

Cargo.toml

+1-1
Original file line numberDiff line numberDiff line change
@@ -16,7 +16,7 @@ either = "1.6.1"
1616
futures = "0.3.19"
1717
json-patch = "0.2.6"
1818
k8s-openapi = { version = "0.14.0", default-features = false, features = ["schemars", "v1_22"] }
19-
kube = { version = "0.69.0", features = ["jsonpatch", "runtime", "derive"] }
19+
kube = { version = "0.69.1", features = ["jsonpatch", "runtime", "derive"] }
2020
lazy_static = "1.4.0"
2121
product-config = { git = "https://github.com/stackabletech/product-config.git", tag = "0.3.0" }
2222
rand = "0.8.4"

src/logging/controller.rs

+78
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,78 @@
1+
//! Facilities for reporting Kubernetes controller outcomes
2+
//!
3+
//! The primary entry point is [`report_controller_reconcilied`].
4+
5+
use std::error::Error;
6+
7+
use kube::{
8+
core::DynamicObject,
9+
runtime::{
10+
controller::{self, ReconcilerAction},
11+
reflector::ObjectRef,
12+
},
13+
Resource,
14+
};
15+
use tracing;
16+
17+
use crate::{client::Client, logging::k8s_events::publish_controller_error_as_k8s_event};
18+
19+
/// [`Error`] extensions that help report reconciliation errors
20+
///
21+
/// This should be implemented for reconciler error types.
22+
pub trait ReconcilerError: Error {
23+
/// `PascalCase`d name for the error category
24+
///
25+
/// This can typically be implemented by delegating to [`strum_macros::EnumDiscriminants`] and [`strum_macros::IntoStaticStr`].
26+
fn category(&self) -> &'static str;
27+
28+
/// A reference to a secondary object providing additional context, if any
29+
///
30+
/// This should be [`Some`] if the error happens while evaluating some related object
31+
/// (for example: when writing a [`StatefulSet`] owned by your controller object).
32+
fn secondary_object(&self) -> Option<ObjectRef<DynamicObject>> {
33+
None
34+
}
35+
}
36+
37+
/// Reports the controller reconciliation result to all relevant targets
38+
///
39+
/// Currently this means that the result is reported to:
40+
/// * The current [`tracing`] `Subscriber`, typically at least stderr
41+
/// * Kubernetes events, if there is an error that is relevant to the end user
42+
pub fn report_controller_reconciled<K, ReconcileErr, QueueErr>(
43+
client: &Client,
44+
controller_name: &str,
45+
result: &Result<(ObjectRef<K>, ReconcilerAction), controller::Error<ReconcileErr, QueueErr>>,
46+
) where
47+
K: Resource,
48+
ReconcileErr: ReconcilerError,
49+
QueueErr: std::error::Error,
50+
{
51+
match result {
52+
Ok((obj, _)) => {
53+
tracing::info!(
54+
controller.name = controller_name,
55+
object = %obj,
56+
"Reconciled object"
57+
);
58+
}
59+
Err(err) => report_controller_error(client, controller_name, err),
60+
}
61+
}
62+
63+
/// Reports an error to the operator administrator and, if relevant, the end user
64+
fn report_controller_error<ReconcileErr, QueueErr>(
65+
client: &Client,
66+
controller_name: &str,
67+
error: &controller::Error<ReconcileErr, QueueErr>,
68+
) where
69+
ReconcileErr: ReconcilerError,
70+
QueueErr: std::error::Error,
71+
{
72+
tracing::error!(
73+
controller.name = controller_name,
74+
error = &*error as &dyn std::error::Error,
75+
"Failed to reconcile object",
76+
);
77+
publish_controller_error_as_k8s_event(client, controller_name, error);
78+
}

src/logging/k8s_events.rs

+157
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,157 @@
1+
//! Utilities for publishing Kubernetes events
2+
3+
use std::error::Error;
4+
5+
use crate::client::Client;
6+
use kube::runtime::{
7+
controller,
8+
events::{Event, EventType, Recorder, Reporter},
9+
};
10+
use tracing::Instrument;
11+
12+
use super::controller::ReconcilerError;
13+
14+
/// Converts an [`Error`] into a publishable Kubernetes [`Event`]
15+
fn error_to_event<E: ReconcilerError>(err: &E) -> Event {
16+
// Walk the whole error chain, so that we get all the full reason for the error
17+
let full_msg = {
18+
use std::fmt::Write;
19+
let mut buf = err.to_string();
20+
let mut err: &dyn Error = err;
21+
loop {
22+
err = match err.source() {
23+
Some(err) => {
24+
write!(buf, ": {}", err).unwrap();
25+
err
26+
}
27+
None => break buf,
28+
}
29+
}
30+
};
31+
Event {
32+
type_: EventType::Warning,
33+
reason: err.category().to_string(),
34+
note: Some(full_msg),
35+
action: "Reconcile".to_string(),
36+
secondary: err.secondary_object().map(|secondary| secondary.into()),
37+
}
38+
}
39+
40+
/// Reports an error coming from a controller to Kubernetes
41+
///
42+
/// This is inteded to be executed on the log entries returned by [`Controller::run`]
43+
#[tracing::instrument(skip(client))]
44+
pub fn publish_controller_error_as_k8s_event<ReconcileErr, QueueErr>(
45+
client: &Client,
46+
controller: &str,
47+
controller_error: &controller::Error<ReconcileErr, QueueErr>,
48+
) where
49+
ReconcileErr: ReconcilerError,
50+
QueueErr: Error,
51+
{
52+
let (error, obj) = match controller_error {
53+
controller::Error::ReconcilerFailed(err, obj) => (err, obj),
54+
// Other error types are intended for the operator administrator, and aren't linked to a specific object
55+
_ => return,
56+
};
57+
let recorder = Recorder::new(
58+
client.as_kube_client(),
59+
Reporter {
60+
controller: controller.to_string(),
61+
instance: None,
62+
},
63+
obj.clone().into(),
64+
);
65+
let event = error_to_event(error);
66+
// Run in the background
67+
tokio::spawn(
68+
async move {
69+
if let Err(err) = recorder.publish(event).await {
70+
tracing::error!(
71+
error = &err as &dyn std::error::Error,
72+
"Failed to report error as K8s event"
73+
);
74+
}
75+
}
76+
.in_current_span(),
77+
);
78+
}
79+
80+
#[cfg(test)]
81+
mod tests {
82+
use k8s_openapi::api::core::v1::ConfigMap;
83+
use kube::runtime::reflector::ObjectRef;
84+
use strum_macros::EnumDiscriminants;
85+
86+
use super::{error_to_event, ReconcilerError};
87+
88+
#[derive(Debug, thiserror::Error, EnumDiscriminants)]
89+
#[strum_discriminants(derive(strum_macros::IntoStaticStr))]
90+
enum ErrorFoo {
91+
#[error("bar failed")]
92+
Bar { source: ErrorBar },
93+
}
94+
#[derive(Debug, thiserror::Error)]
95+
enum ErrorBar {
96+
#[error("baz failed")]
97+
Baz { source: ErrorBaz },
98+
}
99+
#[derive(Debug, thiserror::Error)]
100+
enum ErrorBaz {
101+
#[error("couldn't find chocolate")]
102+
NoChocolate { descriptor: ObjectRef<ConfigMap> },
103+
}
104+
impl ErrorFoo {
105+
fn no_chocolate() -> Self {
106+
Self::Bar {
107+
source: ErrorBar::Baz {
108+
source: ErrorBaz::NoChocolate {
109+
descriptor: ObjectRef::new("chocolate-descriptor").within("cupboard"),
110+
},
111+
},
112+
}
113+
}
114+
}
115+
impl ReconcilerError for ErrorFoo {
116+
fn category(&self) -> &'static str {
117+
ErrorFooDiscriminants::from(self).into()
118+
}
119+
120+
fn secondary_object(&self) -> Option<ObjectRef<kube::core::DynamicObject>> {
121+
match self {
122+
ErrorFoo::Bar {
123+
source:
124+
ErrorBar::Baz {
125+
source: ErrorBaz::NoChocolate { descriptor },
126+
},
127+
} => Some(descriptor.clone().erase()),
128+
}
129+
}
130+
}
131+
132+
#[test]
133+
fn event_should_report_full_nested_message() {
134+
let err = ErrorFoo::no_chocolate();
135+
assert_eq!(
136+
error_to_event(&err).note.as_deref(),
137+
Some("bar failed: baz failed: couldn't find chocolate")
138+
);
139+
}
140+
141+
#[test]
142+
fn event_should_include_secondary_object() {
143+
let err = ErrorFoo::no_chocolate();
144+
let event = error_to_event(&err);
145+
let secondary = event.secondary.unwrap();
146+
assert_eq!(secondary.name.as_deref(), Some("chocolate-descriptor"));
147+
assert_eq!(secondary.namespace.as_deref(), Some("cupboard"));
148+
assert_eq!(secondary.kind.as_deref(), Some("ConfigMap"));
149+
}
150+
151+
#[test]
152+
fn event_should_include_reason_code() {
153+
let err = ErrorFoo::no_chocolate();
154+
let event = error_to_event(&err);
155+
assert_eq!(event.reason, "Bar");
156+
}
157+
}

src/logging.rs src/logging/mod.rs

+3
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,9 @@
11
use tracing;
22
use tracing_subscriber::EnvFilter;
33

4+
pub mod controller;
5+
mod k8s_events;
6+
47
/// Initializes `tracing` logging with options from the environment variable
58
/// given in the `env` parameter.
69
///

0 commit comments

Comments
 (0)