risingwave_meta/backup_restore/
metrics.rs

1// Copyright 2025 RisingWave Labs
2//
3// Licensed under the Apache License, Version 2.0 (the "License");
4// you may not use this file except in compliance with the License.
5// You may obtain a copy of the License at
6//
7//     http://www.apache.org/licenses/LICENSE-2.0
8//
9// Unless required by applicable law or agreed to in writing, software
10// distributed under the License is distributed on an "AS IS" BASIS,
11// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12// See the License for the specific language governing permissions and
13// limitations under the License.
14
15use std::sync::LazyLock;
16
17use prometheus::{
18    Histogram, IntCounter, Registry, exponential_buckets, histogram_opts,
19    register_histogram_vec_with_registry, register_int_counter_with_registry,
20};
21use risingwave_common::monitor::GLOBAL_METRICS_REGISTRY;
22
23pub static GLOBAL_BACKUP_MANAGER_METRICS: LazyLock<BackupManagerMetrics> =
24    LazyLock::new(|| BackupManagerMetrics::new(&GLOBAL_METRICS_REGISTRY));
25
26#[derive(Clone)]
27pub struct BackupManagerMetrics {
28    pub job_count: IntCounter,
29    pub job_latency_success: Histogram,
30    pub job_latency_failure: Histogram,
31}
32
33impl Default for BackupManagerMetrics {
34    fn default() -> Self {
35        GLOBAL_BACKUP_MANAGER_METRICS.clone()
36    }
37}
38
39impl BackupManagerMetrics {
40    fn new(registry: &Registry) -> Self {
41        let job_count = register_int_counter_with_registry!(
42            "backup_job_count",
43            "total backup job count since meta node is started",
44            registry,
45        )
46        .unwrap();
47        let opts = histogram_opts!(
48            "backup_job_latency",
49            "latency of backup jobs since meta node is started",
50            exponential_buckets(1.0, 1.5, 20).unwrap(),
51        );
52        let job_latency =
53            register_histogram_vec_with_registry!(opts, &["state"], registry,).unwrap();
54        let job_latency_success = job_latency
55            .get_metric_with_label_values(&["success"])
56            .unwrap();
57        let job_latency_failure = job_latency
58            .get_metric_with_label_values(&["failure"])
59            .unwrap();
60        Self {
61            job_count,
62            job_latency_success,
63            job_latency_failure,
64        }
65    }
66}