risingwave_expr_impl/scalar/jsonb_delete.rs
1// Copyright 2025 RisingWave Labs
2//
3// Licensed under the Apache License, Version 2.0 (the "License");
4// you may not use this file except in compliance with the License.
5// You may obtain a copy of the License at
6//
7// http://www.apache.org/licenses/LICENSE-2.0
8//
9// Unless required by applicable law or agreed to in writing, software
10// distributed under the License is distributed on an "AS IS" BASIS,
11// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12// See the License for the specific language governing permissions and
13// limitations under the License.
14
15use std::collections::HashSet;
16
17use jsonbb::{Value, ValueRef};
18use risingwave_common::types::{JsonbRef, JsonbVal, ListRef};
19use risingwave_expr::{ExprError, Result, function};
20
21/// Removes a key (and its value) from a JSON object, or matching string value(s) from a JSON array.
22///
23/// Examples:
24///
25/// ```slt
26/// # remove key from object
27/// query T
28/// SELECT '{"a": "b", "c": "d"}'::jsonb - 'a';
29/// ----
30/// {"c": "d"}
31///
32/// # remove matching value from array
33/// query T
34/// SELECT '["a", "b", "c", "b"]'::jsonb - 'b';
35/// ----
36/// ["a", "c"]
37///
38/// query error cannot delete from scalar
39/// SELECT '1'::jsonb - 'b';
40/// ```
41#[function("subtract(jsonb, varchar) -> jsonb")]
42fn jsonb_remove(v: JsonbRef<'_>, key: &str) -> Result<JsonbVal> {
43 match v.into() {
44 ValueRef::Object(obj) => Ok(JsonbVal::from(Value::object(
45 obj.iter().filter(|(k, _)| *k != key),
46 ))),
47 ValueRef::Array(arr) => Ok(JsonbVal::from(Value::array(
48 arr.iter().filter(|value| value.as_str() != Some(key)),
49 ))),
50 _ => Err(ExprError::InvalidParam {
51 name: "jsonb",
52 reason: "cannot delete from scalar".into(),
53 }),
54 }
55}
56
57/// Deletes all matching keys or array elements from the left operand.
58///
59/// Examples:
60///
61/// ```slt
62/// query T
63/// SELECT '{"a": "b", "c": "d"}'::jsonb - '{a,c}'::text[];
64/// ----
65/// {}
66///
67/// query error cannot delete from scalar
68/// SELECT '1'::jsonb - '{a,c}'::text[];
69/// ```
70#[function("subtract(jsonb, varchar[]) -> jsonb")]
71fn jsonb_remove_keys(v: JsonbRef<'_>, keys: ListRef<'_>) -> Result<JsonbVal> {
72 let keys_set: HashSet<&str> = keys.iter().flatten().map(|s| s.into_utf8()).collect();
73
74 match v.into() {
75 ValueRef::Object(obj) => Ok(JsonbVal::from(Value::object(
76 obj.iter().filter(|(k, _)| !keys_set.contains(*k)),
77 ))),
78 ValueRef::Array(arr) => {
79 Ok(JsonbVal::from(Value::array(arr.iter().filter(
80 |value| match value.as_str() {
81 Some(s) => !keys_set.contains(s),
82 None => true,
83 },
84 ))))
85 }
86 _ => Err(ExprError::InvalidParam {
87 name: "jsonb",
88 reason: "cannot delete from scalar".into(),
89 }),
90 }
91}
92
93/// Deletes the array element with the specified index (negative integers count from the end).
94/// Throws an error if JSON value is not an array.
95///
96/// Examples:
97///
98/// ```slt
99/// query T
100/// SELECT '["a", "b"]'::jsonb - 1;
101/// ----
102/// ["a"]
103///
104/// query T
105/// SELECT '["a", "b"]'::jsonb - -1;
106/// ----
107/// ["a"]
108///
109/// query T
110/// SELECT '["a", "b"]'::jsonb - 2;
111/// ----
112/// ["a", "b"]
113///
114/// query T
115/// SELECT '["a", "b"]'::jsonb - -3;
116/// ----
117/// ["a", "b"]
118///
119/// query error cannot delete from scalar
120/// SELECT '1'::jsonb - 1;
121///
122/// query error cannot delete from object using integer index
123/// SELECT '{"a": 1}'::jsonb - 1;
124/// ```
125#[function("subtract(jsonb, int4) -> jsonb")]
126fn jsonb_remove_index(v: JsonbRef<'_>, index: i32) -> Result<JsonbVal> {
127 let array = match v.into() {
128 ValueRef::Array(array) => array,
129 ValueRef::Object(_) => {
130 return Err(ExprError::InvalidParam {
131 name: "jsonb",
132 reason: "cannot delete from object using integer index".into(),
133 });
134 }
135 _ => {
136 return Err(ExprError::InvalidParam {
137 name: "jsonb",
138 reason: "cannot delete from scalar".into(),
139 });
140 }
141 };
142 let Some(idx) = normalize_array_index(array.len(), index) else {
143 // out of bounds index returns original value
144 return Ok(JsonbVal::from(v));
145 };
146 Ok(JsonbVal::from(Value::array(
147 array
148 .iter()
149 .enumerate()
150 .filter(|&(i, _)| i != idx)
151 .map(|(_, v)| v),
152 )))
153}
154
155/// Deletes the field or array element at the specified path, where path elements can be
156/// either field keys or array indexes.
157///
158/// Examples:
159///
160/// ```slt
161/// # Basic test case
162/// query T
163/// SELECT '["a", {"b":1}]'::jsonb #- '{1,b}';
164/// ----
165/// ["a", {}]
166///
167/// # Invalid path
168/// query error path element at position 1 is null
169/// SELECT '["a", {"b":1}]'::jsonb #- array[null];
170///
171/// # Removing non-existent key from an object
172/// query T
173/// SELECT '{"a": 1, "b": 2}'::jsonb #- '{c}';
174/// ----
175/// {"a": 1, "b": 2}
176///
177/// # Removing an existing key from an object
178/// query T
179/// SELECT '{"a": 1, "b": 2}'::jsonb #- '{a}';
180/// ----
181/// {"b": 2}
182///
183/// # Removing an item from an array by positive index
184/// query T
185/// SELECT '["a", "b", "c"]'::jsonb #- '{1}';
186/// ----
187/// ["a", "c"]
188///
189/// # Removing an item from an array by negative index
190/// query T
191/// SELECT '["a", "b", "c"]'::jsonb #- '{-1}';
192/// ----
193/// ["a", "b"]
194///
195/// # Removing a non-existent index from an array
196/// query T
197/// SELECT '["a", "b", "c"]'::jsonb #- '{3}';
198/// ----
199/// ["a", "b", "c"]
200///
201/// # Path element is not an integer for array
202/// query error path element at position 1 is not an integer: "a"
203/// SELECT '["a", "b", "c"]'::jsonb #- '{a}';
204///
205/// # Path to deeply nested value
206/// query T
207/// SELECT '{"a": {"b": {"c": [1, 2, 3]}}}'::jsonb #- '{a,b,c,1}';
208/// ----
209/// {"a": {"b": {"c": [1, 3]}}}
210///
211/// # Path terminates early (before reaching the final depth of the JSON)
212/// query T
213/// SELECT '{"a": {"b": {"c": [1, 2, 3]}}}'::jsonb #- '{a}';
214/// ----
215/// {}
216///
217/// # Removing non-existent path in nested structure
218/// query T
219/// SELECT '{"a": {"b": {"c": [1, 2, 3]}}}'::jsonb #- '{a,x}';
220/// ----
221/// {"a": {"b": {"c": [1, 2, 3]}}}
222///
223/// # Path is longer than the depth of the JSON structure
224/// query T
225/// SELECT '{"a": 1}'::jsonb #- '{a,b}';
226/// ----
227/// {"a": 1}
228///
229/// # Edge case: Removing root
230/// query T
231/// SELECT '{"a": 1}'::jsonb #- '{}';
232/// ----
233/// {"a": 1}
234///
235/// # Edge case: Empty array
236/// query T
237/// SELECT '[]'::jsonb #- '{a}';
238/// ----
239/// []
240///
241/// # Edge case: Empty object
242/// query T
243/// SELECT '{}'::jsonb #- '{null}';
244/// ----
245/// {}
246///
247/// query error cannot delete path in scalar
248/// SELECT '1'::jsonb #- '{}';
249/// ```
250#[function("jsonb_delete_path(jsonb, varchar[]) -> jsonb")]
251fn jsonb_delete_path(v: JsonbRef<'_>, path: ListRef<'_>) -> Result<JsonbVal> {
252 if v.is_scalar() {
253 return Err(ExprError::InvalidParam {
254 name: "jsonb",
255 reason: "cannot delete path in scalar".into(),
256 });
257 }
258 if path.is_empty() {
259 return Ok(JsonbVal::from(v));
260 }
261 let jsonb: ValueRef<'_> = v.into();
262 let mut builder = jsonbb::Builder::<Vec<u8>>::with_capacity(jsonb.capacity());
263 jsonbb_remove_path(jsonb, path, 0, &mut builder)?;
264 Ok(JsonbVal::from(builder.finish()))
265}
266
267// Recursively remove `path[i..]` from `jsonb` and write the result to `builder`.
268// Panics if `i` is out of bounds.
269fn jsonbb_remove_path(
270 jsonb: ValueRef<'_>,
271 path: ListRef<'_>,
272 i: usize,
273 builder: &mut jsonbb::Builder,
274) -> Result<()> {
275 match jsonb {
276 ValueRef::Object(obj) => {
277 if obj.is_empty() {
278 builder.add_value(jsonb);
279 return Ok(());
280 }
281 let key = path
282 .get(i)
283 .unwrap()
284 .ok_or_else(|| ExprError::InvalidParam {
285 name: "path",
286 reason: format!("path element at position {} is null", i + 1).into(),
287 })?
288 .into_utf8();
289 if !obj.contains_key(key) {
290 builder.add_value(jsonb);
291 return Ok(());
292 }
293 builder.begin_object();
294 for (k, v) in obj.iter() {
295 if k != key {
296 builder.add_string(k);
297 builder.add_value(v);
298 continue;
299 }
300 if i != path.len() - 1 {
301 builder.add_string(k);
302 // recursively remove path[i+1..] from v
303 jsonbb_remove_path(v, path, i + 1, builder)?;
304 }
305 }
306 builder.end_object();
307 Ok(())
308 }
309 ValueRef::Array(array) => {
310 if array.is_empty() {
311 builder.add_value(jsonb);
312 return Ok(());
313 }
314 let key = path
315 .get(i)
316 .unwrap()
317 .ok_or_else(|| ExprError::InvalidParam {
318 name: "path",
319 reason: format!("path element at position {} is null", i + 1).into(),
320 })?
321 .into_utf8();
322 let idx = key.parse::<i32>().map_err(|_| ExprError::InvalidParam {
323 name: "path",
324 reason: format!(
325 "path element at position {} is not an integer: \"{}\"",
326 i + 1,
327 key
328 )
329 .into(),
330 })?;
331 let Some(idx) = normalize_array_index(array.len(), idx) else {
332 // out of bounds index returns original value
333 builder.add_value(jsonb);
334 return Ok(());
335 };
336 builder.begin_array();
337 for (j, v) in array.iter().enumerate() {
338 if j != idx {
339 builder.add_value(v);
340 continue;
341 }
342 if i != path.len() - 1 {
343 // recursively remove path[i+1..] from v
344 jsonbb_remove_path(v, path, i + 1, builder)?;
345 }
346 }
347 builder.end_array();
348 Ok(())
349 }
350 _ => {
351 builder.add_value(jsonb);
352 Ok(())
353 }
354 }
355}
356
357/// Normalizes an array index to `0..len`.
358/// Negative indices count from the end. i.e. `-len..0 => 0..len`.
359/// Returns `None` if index is out of bounds.
360fn normalize_array_index(len: usize, index: i32) -> Option<usize> {
361 if index < -(len as i32) || index >= (len as i32) {
362 return None;
363 }
364 if index >= 0 {
365 Some(index as usize)
366 } else {
367 Some((len as i32 + index) as usize)
368 }
369}
370
371/// Recursively removes all object fields that have null values from the given JSON value.
372/// Null values that are not object fields are untouched.
373///
374/// Examples:
375///
376/// ```slt
377/// query T
378/// SELECT jsonb_strip_nulls('[{"f1":1, "f2":null}, 2, null, 3]');
379/// ----
380/// [{"f1": 1}, 2, null, 3]
381/// ```
382#[function("jsonb_strip_nulls(jsonb) -> jsonb")]
383fn jsonb_strip_nulls(v: JsonbRef<'_>) -> JsonbVal {
384 let jsonb: ValueRef<'_> = v.into();
385 let mut builder = jsonbb::Builder::<Vec<u8>>::with_capacity(jsonb.capacity());
386 jsonbb_strip_nulls(jsonb, &mut builder);
387 JsonbVal::from(builder.finish())
388}
389
390/// Recursively removes all object fields that have null values from the given JSON value.
391fn jsonbb_strip_nulls(jsonb: ValueRef<'_>, builder: &mut jsonbb::Builder) {
392 match jsonb {
393 ValueRef::Object(obj) => {
394 builder.begin_object();
395 for (k, v) in obj.iter() {
396 if let ValueRef::Null = v {
397 continue;
398 }
399 builder.add_string(k);
400 jsonbb_strip_nulls(v, builder);
401 }
402 builder.end_object();
403 }
404 ValueRef::Array(array) => {
405 builder.begin_array();
406 for v in array.iter() {
407 jsonbb_strip_nulls(v, builder);
408 }
409 builder.end_array();
410 }
411 _ => builder.add_value(jsonb),
412 }
413}