risingwave_expr_impl/scalar/overlay.rs
1// Copyright 2025 RisingWave Labs
2//
3// Licensed under the Apache License, Version 2.0 (the "License");
4// you may not use this file except in compliance with the License.
5// You may obtain a copy of the License at
6//
7// http://www.apache.org/licenses/LICENSE-2.0
8//
9// Unless required by applicable law or agreed to in writing, software
10// distributed under the License is distributed on an "AS IS" BASIS,
11// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12// See the License for the specific language governing permissions and
13// limitations under the License.
14
15use std::fmt::Write;
16
17use risingwave_expr::{ExprError, Result, function};
18
19/// Replaces a substring of the given string with a new substring.
20///
21/// ```slt
22/// query T
23/// select overlay('αβγδεζ' placing '💯' from 3);
24/// ----
25/// αβ💯δεζ
26/// ```
27#[function("overlay(varchar, varchar, int4) -> varchar")]
28pub fn overlay(s: &str, new_sub_str: &str, start: i32, writer: &mut impl Write) -> Result<()> {
29 let sub_len = new_sub_str
30 .chars()
31 .count()
32 .try_into()
33 .map_err(|_| ExprError::NumericOutOfRange)?;
34 overlay_for(s, new_sub_str, start, sub_len, writer)
35}
36
37/// Replaces a substring of the given string with a new substring.
38///
39/// ```slt
40/// statement error not positive
41/// select overlay('αβγδεζ' placing '①②③' from 0);
42///
43/// query T
44/// select overlay('αβγδεζ' placing '①②③' from 10);
45/// ----
46/// αβγδεζ①②③
47///
48/// query T
49/// select overlay('αβγδεζ' placing '①②③' from 4 for 2);
50/// ----
51/// αβγ①②③ζ
52///
53/// query T
54/// select overlay('αβγδεζ' placing '①②③' from 4);
55/// ----
56/// αβγ①②③
57///
58/// query T
59/// select overlay('αβγδεζ' placing '①②③' from 2 for 4);
60/// ----
61/// α①②③ζ
62///
63/// query T
64/// select overlay('αβγδεζ' placing '①②③' from 2 for 7);
65/// ----
66/// α①②③
67///
68/// query T
69/// select overlay('αβγδεζ' placing '①②③' from 4 for 0);
70/// ----
71/// αβγ①②③δεζ
72///
73/// query T
74/// select overlay('αβγδεζ' placing '①②③' from 4 for -2);
75/// ----
76/// αβγ①②③βγδεζ
77///
78/// query T
79/// select overlay('αβγδεζ' placing '①②③' from 4 for -1000);
80/// ----
81/// αβγ①②③αβγδεζ
82/// ```
83#[function("overlay(varchar, varchar, int4, int4) -> varchar")]
84pub fn overlay_for(
85 s: &str,
86 new_sub_str: &str,
87 start: i32,
88 count: i32,
89 writer: &mut impl Write,
90) -> Result<()> {
91 if start <= 0 {
92 return Err(ExprError::InvalidParam {
93 name: "start",
94 reason: format!("{start} is not positive").into(),
95 });
96 }
97
98 let mut chars = s.char_indices().skip(start as usize - 1).peekable();
99
100 // write the substring before the overlay.
101 let leading = match chars.peek() {
102 Some((i, _)) => &s[..*i],
103 None => s,
104 };
105 writer.write_str(leading).unwrap();
106
107 // write the new substring.
108 writer.write_str(new_sub_str).unwrap();
109
110 let Ok(count) = count.try_into() else {
111 // For negative `count`, which is rare in practice, we hand over to `substr`
112 let start_right = start
113 .checked_add(count)
114 .ok_or(ExprError::NumericOutOfRange)?;
115 return super::substr::substr_start(s, start_right, writer);
116 };
117
118 // write the substring after the overlay.
119 if let Some((i, _)) = chars.nth(count) {
120 writer.write_str(&s[i..]).unwrap();
121 }
122
123 Ok(())
124}
125
126#[cfg(test)]
127mod tests {
128 use super::*;
129
130 #[test]
131 fn test_overlay() {
132 case("aaa__aaa", "XY", 4, None, "aaaXYaaa");
133 // Place at end.
134 case("aaa", "XY", 4, None, "aaaXY");
135 // Place at start.
136 case("aaa", "XY", 1, Some(0), "XYaaa");
137 // Replace shorter string.
138 case("aaa_aaa", "XYZ", 4, Some(1), "aaaXYZaaa");
139 case("aaaaaa", "XYZ", 4, Some(0), "aaaXYZaaa");
140 // Replace longer string.
141 case("aaa___aaa", "X", 4, Some(3), "aaaXaaa");
142 // start too large.
143 case("aaa", "XY", 123, None, "aaaXY");
144 // count too small or large.
145 case("aaa", "X", 4, Some(-123), "aaaXaaa");
146 case("aaa_", "X", 4, Some(123), "aaaX");
147 // very large start and count
148 case("aaa", "X", i32::MAX, Some(i32::MAX), "aaaX");
149
150 #[track_caller]
151 fn case(s: &str, new_sub_str: &str, start: i32, count: Option<i32>, expected: &str) {
152 let mut writer = String::new();
153 match count {
154 None => overlay(s, new_sub_str, start, &mut writer),
155 Some(count) => overlay_for(s, new_sub_str, start, count, &mut writer),
156 }
157 .unwrap();
158 assert_eq!(writer, expected);
159 }
160 }
161}