// risingwave_error/tonic.rs

// Copyright 2024 RisingWave Labs
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

pub mod extra;

use std::borrow::Cow;
use std::error::Error;
use std::sync::Arc;

use serde::{Deserialize, Serialize};
use thiserror_ext::AsReport;
use tonic::metadata::{MetadataMap, MetadataValue};

/// The key of the gRPC metadata entry that contains the serialized [`ServerError`].
///
/// The entry is written with `MetadataMap::insert_bin` when a status is built on the server
/// side and read back with `get_bin` in [`TonicStatusWrapper::new`], so both sides must agree
/// on this exact value.
// NOTE(review): the `-bin` suffix is presumably what tonic requires for binary metadata keys;
// confirm against the tonic documentation before renaming.
const ERROR_KEY: &str = "risingwave-error-bin";

/// The name of the service that the error is from. Used to provide a better error message.
///
/// This is a [`Cow`] so that callers can pass either a `&'static str` literal or an owned
/// `String` through `impl Into<ServiceName>`.
// TODO: also make it a field of `Extra`?
type ServiceName = Cow<'static, str>;

/// The error produced by the gRPC server and sent to the client on the wire.
///
/// It is serialized with `bincode` into the metadata entry named by [`ERROR_KEY`] when a status
/// is built, and deserialized again by [`TonicStatusWrapper::new`] on the receiving side.
// NOTE(review): presumably bincode encodes fields positionally, so reordering, adding or removing
// fields may break compatibility between servers and clients of different versions. Confirm
// before changing the layout.
#[derive(Debug, Serialize, Deserialize)]
struct ServerError {
    /// Serializable snapshot of the original error, built with `serde_error::Error::new`.
    error: serde_error::Error,
    /// The service that produced the error, if the caller specified one.
    service_name: Option<ServiceName>,
    /// Extra fields extracted from the original error; re-exposed through `Error::provide`.
    extra: extra::Extra,
}

impl std::fmt::Display for ServerError {
    /// Displays exactly what the wrapped serialized error displays.
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        std::fmt::Display::fmt(&self.error, f)
    }
}

impl std::error::Error for ServerError {
    /// The source chain is the one recorded in the wrapped serialized error.
    fn source(&self) -> Option<&(dyn Error + 'static)> {
        Error::source(&self.error)
    }

    /// Exposes this value itself plus everything the `extra` field has to offer.
    fn provide<'a>(&'a self, request: &mut std::error::Request<'a>) {
        // Providing `Self` is what makes `ErrorIsFromTonicServerImpl` able to detect us.
        request.provide_ref::<Self>(self);
        // Then let the extra fields answer the request as well.
        self.extra.provide(request);
    }
}

fn to_status<T>(error: &T, code: tonic::Code, service_name: Option<ServiceName>) -> tonic::Status
where
    T: ?Sized + std::error::Error,
{
    // Embed the whole error (`self`) and its source chain into the details field.
    // At the same time, set the message field to the error message of `self` (without source chain).
    // The redundancy of the current error's message is intentional in case the client ignores the `details` field.
    let source = ServerError {
        error: serde_error::Error::new(error),
        service_name,
        extra: extra::Extra::new(error),
    };
    let serialized = bincode::serialize(&source).unwrap();

    let mut metadata = MetadataMap::new();
    metadata.insert_bin(ERROR_KEY, MetadataValue::from_bytes(&serialized));

    let mut status = tonic::Status::with_metadata(code, error.to_report_string(), metadata);
    // Set the source of `tonic::Status`, though it's not likely to be used.
    // This is only available before serializing to the wire. That's why we need to manually embed it
    // into the `details` field.
    status.set_source(Arc::new(source));
    status
}

// TODO(error-handling): disallow constructing `tonic::Status` directly with `new` by clippy.
#[easy_ext::ext(ToTonicStatus)]
impl<T> T
where
    T: ?Sized + std::error::Error,
{
    /// Turn this error into a [`tonic::Status`] carrying the given [`tonic::Code`] and the name
    /// of the service that produced it.
    ///
    /// Pair with [`TonicStatusWrapper`] on the receiving side to get the source chain back.
    pub fn to_status(
        &self,
        code: tonic::Code,
        service_name: impl Into<ServiceName>,
    ) -> tonic::Status {
        let service_name: ServiceName = service_name.into();
        to_status(self, code, Some(service_name))
    }

    /// Turn this error into a [`tonic::Status`] carrying the given [`tonic::Code`], leaving the
    /// service name unspecified. Prefer [`ToTonicStatus::to_status`] if possible.
    ///
    /// Pair with [`TonicStatusWrapper`] on the receiving side to get the source chain back.
    pub fn to_status_unnamed(&self, code: tonic::Code) -> tonic::Status {
        let service_name: Option<ServiceName> = None;
        to_status(self, code, service_name)
    }
}

#[easy_ext::ext(ErrorIsFromTonicServerImpl)]
impl<T> T
where
    T: ?Sized + std::error::Error,
{
    /// Returns whether the error is from the implementation of a tonic server, i.e., created
    /// with [`ToTonicStatus::to_status`].
    ///
    /// This does not count errors initiated from the library, typically connection issues.
    /// As a result, this function can be used to decide whether an error should be retried.
    pub fn is_from_tonic_server_impl(&self) -> bool {
        std::error::request_ref::<ServerError>(self).is_some()
    }
}

/// A wrapper of [`tonic::Status`] that provides better error message and extracts
/// the source chain from the serialized error carried in the status metadata.
///
/// Construct it with [`TonicStatusWrapper::new`] or through the `From<tonic::Status>`
/// conversion.
#[derive(Debug)]
pub struct TonicStatusWrapper {
    /// The wrapped status. Its source is filled in by [`TonicStatusWrapper::new`] when a
    /// serialized error can be recovered from the metadata.
    inner: tonic::Status,

    /// Optional service name from the client side.
    ///
    /// # Explanation
    ///
    /// [`tonic::Status`] is used for both client and server side. When the error is created on
    /// the server side, we encourage developers to provide the service name with
    /// [`ToTonicStatus::to_status`], so that the info can be included in the HTTP response and
    /// then extracted by the client side (in [`TonicStatusWrapper::new`]).
    ///
    /// However, if there's something wrong with the server side and the error is directly
    /// created on the client side, the approach above is not applicable. In this case, the
    /// caller should set a "client side" service name to provide better error message. This is
    /// achieved by [`TonicStatusWrapperExt::with_client_side_service_name`].
    ///
    /// When formatting, this name is only used as a fallback if the server side did not
    /// provide one.
    client_side_service_name: Option<ServiceName>,
}

impl TonicStatusWrapper {
    /// Wrap the given [`tonic::Status`], recovering its source chain from the serialized
    /// error in the metadata when possible.
    ///
    /// A status that already has a source is left untouched. If the metadata entry exists but
    /// cannot be decoded, a warning is logged and the status is kept without a source.
    pub fn new(mut status: tonic::Status) -> Self {
        if status.source().is_none() {
            if let Some(raw) = status.metadata().get_bin(ERROR_KEY) {
                // Both the byte decoding and the deserialization may fail; treat them alike.
                let decoded = match raw.to_bytes() {
                    Ok(bytes) => bincode::deserialize::<ServerError>(bytes.as_ref()).ok(),
                    Err(_) => None,
                };

                match decoded {
                    Some(server_error) => {
                        status.set_source(Arc::new(server_error));
                    }
                    None => {
                        tracing::warn!("failed to deserialize error from gRPC metadata");
                    }
                }
            }
        }

        Self {
            client_side_service_name: None,
            inner: status,
        }
    }

    /// Borrows the wrapped [`tonic::Status`].
    pub fn inner(&self) -> &tonic::Status {
        &self.inner
    }

    /// Unwraps into the wrapped [`tonic::Status`], discarding the client side service name.
    pub fn into_inner(self) -> tonic::Status {
        let Self { inner, .. } = self;
        inner
    }
}

impl From<tonic::Status> for TonicStatusWrapper {
    fn from(status: tonic::Status) -> Self {
        Self::new(status)
    }
}

/// Formats as `gRPC request[ to <service> service] failed: <code>: <detail>`.
///
/// `<service>` is the service name recorded by the server if there is one, otherwise the
/// client side service name, otherwise the ` to ... service` part is omitted entirely.
/// `<detail>` is the source error if the status has one, otherwise the status message.
impl std::fmt::Display for TonicStatusWrapper {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        write!(f, "gRPC request")?;

        // Look for a service name on the source, which is a `ServerError` when the error was
        // produced by a server implementation.
        if let Some(service_name) = self
            .source()
            .and_then(|s| s.downcast_ref::<ServerError>())
            .and_then(|s| s.service_name.as_ref())
            // if no service name from the server side, use the client side one
            .or(self.client_side_service_name.as_ref())
        {
            write!(f, " to {} service", service_name)?;
        }
        write!(f, " failed: {}: ", self.inner.code())?;

        #[expect(rw::format_error)] // intentionally format the source itself
        if let Some(source) = self.source() {
            // Prefer the source over the plain status message. Only the source's own message is
            // written here; the rest of its chain stays reachable through `source()`.
            write!(f, "{}", source)
        } else {
            // No source available: fall back to the message carried by the status.
            write!(f, "{}", self.inner.message())
        }
    }
}

#[easy_ext::ext(TonicStatusWrapperExt)]
impl<T> T
where
    T: Into<TonicStatusWrapper>,
{
    /// Set the client side service name to provide better error message.
    ///
    /// See the documentation on the field `client_side_service_name` for more details.
    pub fn with_client_side_service_name(
        self,
        service_name: impl Into<ServiceName>,
    ) -> TonicStatusWrapper {
        let mut this = self.into();
        this.client_side_service_name = Some(service_name.into());
        this
    }
}

impl std::error::Error for TonicStatusWrapper {
    fn source(&self) -> Option<&(dyn std::error::Error + 'static)> {
        // Delegate to `self.inner` as if we're transparent.
        self.inner.source()
    }

    fn provide<'a>(&'a self, request: &mut std::error::Request<'a>) {
        // The source error, typically a `ServerError`, may provide additional information through `extra`.
        if let Some(source) = self.source() {
            source.provide(request);
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    /// Round-trips an error with a two-level source chain through the HTTP representation of
    /// a status and checks that the client side sees the same messages and chain.
    #[test]
    fn test_source_chain_preserved() {
        // A minimal error type that displays as its `message` and has an optional nested source.
        #[derive(thiserror::Error, Debug)]
        #[error("{message}")]
        struct MyError {
            message: &'static str,
            source: Option<Box<MyError>>,
        }

        // "outer" caused by "inner".
        let original = MyError {
            message: "outer",
            source: Some(Box::new(MyError {
                message: "inner",
                source: None,
            })),
        };

        // Server side: build the status, then go through the HTTP headers as the client would
        // receive them, so that only what is actually on the wire survives.
        let server_status = original.to_status(tonic::Code::Internal, "test");
        let body = server_status.into_http();
        let client_status = tonic::Status::from_header_map(body.headers()).unwrap();

        // Client side: the wrapper recovers the service name and the source.
        let wrapper = TonicStatusWrapper::new(client_status);
        assert_eq!(
            wrapper.to_string(),
            "gRPC request to test service failed: Internal error: outer"
        );

        // The recovered source is the `ServerError`, and its chain matches the original one.
        let source = wrapper.source().unwrap();
        assert!(source.is::<ServerError>());
        assert_eq!(source.to_string(), "outer");
        assert_eq!(source.source().unwrap().to_string(), "inner");
    }
}