// risingwave_frontend/optimizer/plan_node/generic/dedup.rs
// Copyright 2024 RisingWave Labs
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

use pretty_xmlish::{Pretty, Str, XmlNode};
use risingwave_common::catalog::{FieldDisplay, Schema};

use super::{DistillUnit, GenericPlanNode, GenericPlanRef};
use crate::optimizer::plan_node::utils::childless_record;
use crate::optimizer::property::FunctionalDependencySet;
use crate::OptimizerContextRef;

/// Generic core of a dedup plan node: an input plan plus the set of columns
/// to deduplicate on.
///
/// In this file the node exposes the input's schema unchanged and reports
/// `dedup_cols` as its stream key.
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
pub struct Dedup<PlanRef> {
    /// The plan whose output is deduplicated.
    pub input: PlanRef,
    /// Column indices of the columns to be deduplicated. Each index refers to
    /// a field of the input's schema.
    pub dedup_cols: Vec<usize>,
}

impl<PlanRef: GenericPlanRef> Dedup<PlanRef> {
    /// Renders the dedup columns as a pretty-printable array, one entry per
    /// column, using each column's [`FieldDisplay`] representation.
    ///
    /// # Panics
    ///
    /// Panics if any index in `dedup_cols` is out of range for the fields of
    /// the input's schema.
    fn dedup_cols_pretty<'a>(&self) -> Pretty<'a> {
        let input_fields = &self.input.schema().fields;
        let rendered: Vec<_> = self
            .dedup_cols
            .iter()
            .map(|&col_idx| {
                // Indices are expected to be valid for the input schema.
                let field = input_fields.get(col_idx).unwrap();
                Pretty::display(&FieldDisplay(field))
            })
            .collect();
        Pretty::Array(rendered)
    }
}

impl<PlanRef: GenericPlanRef> DistillUnit for Dedup<PlanRef> {
    /// Builds a childless record named `name` whose only attribute,
    /// `dedup_cols`, lists the pretty-printed dedup columns.
    fn distill_with_name<'a>(&self, name: impl Into<Str<'a>>) -> XmlNode<'a> {
        let attributes = vec![("dedup_cols", self.dedup_cols_pretty())];
        childless_record(name, attributes)
    }
}

impl<PlanRef: GenericPlanRef> GenericPlanNode for Dedup<PlanRef> {
    /// Returns a copy of the input's schema; dedup does not add, remove or
    /// reorder columns.
    fn schema(&self) -> Schema {
        let input_schema = self.input.schema();
        input_schema.clone()
    }

    /// Returns the dedup columns as the stream key (always `Some`).
    fn stream_key(&self) -> Option<Vec<usize>> {
        let key_cols = self.dedup_cols.to_vec();
        Some(key_cols)
    }

    /// Returns the optimizer context of the input plan.
    fn ctx(&self) -> OptimizerContextRef {
        let input = &self.input;
        input.ctx()
    }

    /// Returns a copy of the input's functional dependencies.
    fn functional_dependency(&self) -> FunctionalDependencySet {
        let input_fds = self.input.functional_dependency();
        input_fds.clone()
    }
}