1use std::collections::HashMap;
16use std::sync::LazyLock;
17
18use bk_tree::{BKTree, metrics};
19use itertools::Itertools;
20use risingwave_common::session_config::USER_NAME_WILD_CARD;
21use risingwave_common::types::{DataType, ListValue, ScalarImpl, Timestamptz};
22use risingwave_common::{bail_not_implemented, current_cluster_version, no_function};
23use thiserror_ext::AsReport;
24
25use crate::Binder;
26use crate::binder::Clause;
27use crate::error::{ErrorCode, Result};
28use crate::expr::{CastContext, Expr, ExprImpl, ExprType, FunctionCall, Literal, Now};
29
30impl Binder {
31 pub(super) fn bind_builtin_scalar_function(
32 &mut self,
33 function_name: &str,
34 inputs: Vec<ExprImpl>,
35 variadic: bool,
36 ) -> Result<ExprImpl> {
37 type Inputs = Vec<ExprImpl>;
38
39 type Handle = Box<dyn Fn(&mut Binder, Inputs) -> Result<ExprImpl> + Sync + Send>;
40
41 fn rewrite(r#type: ExprType, rewriter: fn(Inputs) -> Result<Inputs>) -> Handle {
42 Box::new(move |_binder, mut inputs| {
43 inputs = (rewriter)(inputs)?;
44 Ok(FunctionCall::new(r#type, inputs)?.into())
45 })
46 }
47
48 fn raw_call(r#type: ExprType) -> Handle {
49 rewrite(r#type, Ok)
50 }
51
52 fn guard_by_len<const E: usize>(
53 handle: impl Fn(&mut Binder, [ExprImpl; E]) -> Result<ExprImpl> + Sync + Send + 'static,
54 ) -> Handle {
55 Box::new(move |binder, inputs| {
56 let input_len = inputs.len();
57 let Ok(inputs) = inputs.try_into() else {
58 return Err(ErrorCode::ExprError(
59 format!("unexpected arguments number {}, expect {}", input_len, E).into(),
60 )
61 .into());
62 };
63 handle(binder, inputs)
64 })
65 }
66
67 fn raw<F: Fn(&mut Binder, Inputs) -> Result<ExprImpl> + Sync + Send + 'static>(
68 f: F,
69 ) -> Handle {
70 Box::new(f)
71 }
72
73 fn dispatch_by_len(mapping: Vec<(usize, Handle)>) -> Handle {
74 Box::new(move |binder, inputs| {
75 for (len, handle) in &mapping {
76 if inputs.len() == *len {
77 return handle(binder, inputs);
78 }
79 }
80 Err(ErrorCode::ExprError("unexpected arguments number".into()).into())
81 })
82 }
83
84 fn raw_literal(literal: ExprImpl) -> Handle {
85 Box::new(move |_binder, _inputs| Ok(literal.clone()))
86 }
87
88 fn now() -> Handle {
89 guard_by_len(move |binder, []| {
90 binder.ensure_now_function_allowed()?;
91 Ok(Now.into())
94 })
95 }
96
97 fn pi() -> Handle {
98 raw_literal(ExprImpl::literal_f64(std::f64::consts::PI))
99 }
100
101 fn proctime() -> Handle {
102 Box::new(move |binder, inputs| {
103 binder.ensure_proctime_function_allowed()?;
104 raw_call(ExprType::Proctime)(binder, inputs)
105 })
106 }
107
108 fn session_user() -> Handle {
110 guard_by_len(|binder, []| {
111 Ok(ExprImpl::literal_varchar(
112 binder.auth_context.user_name.clone(),
113 ))
114 })
115 }
116
117 fn current_user() -> Handle {
121 guard_by_len(|binder, []| {
122 Ok(ExprImpl::literal_varchar(
123 binder.auth_context.user_name.clone(),
124 ))
125 })
126 }
127
128 fn current_database() -> Handle {
131 guard_by_len(|binder, []| Ok(ExprImpl::literal_varchar(binder.db_name.clone())))
132 }
133
134 static HANDLES: LazyLock<HashMap<&'static str, Handle>> = LazyLock::new(|| {
138 [
139 (
140 "booleq",
141 rewrite(ExprType::Equal, rewrite_two_bool_inputs),
142 ),
143 (
144 "boolne",
145 rewrite(ExprType::NotEqual, rewrite_two_bool_inputs),
146 ),
147 ("coalesce", rewrite(ExprType::Coalesce, |inputs| {
148 if inputs.iter().any(ExprImpl::has_table_function) {
149 return Err(ErrorCode::BindError("table functions are not allowed in COALESCE".into()).into());
150 }
151 Ok(inputs)
152 })),
153 (
154 "nullif",
155 rewrite(ExprType::Case, rewrite_nullif_to_case_when),
156 ),
157 (
158 "round",
159 dispatch_by_len(vec![
160 (2, raw_call(ExprType::RoundDigit)),
161 (1, raw_call(ExprType::Round)),
162 ]),
163 ),
164 ("pow", raw_call(ExprType::Pow)),
165 ("power", raw_call(ExprType::Pow)),
167 ("ceil", raw_call(ExprType::Ceil)),
168 ("ceiling", raw_call(ExprType::Ceil)),
169 ("floor", raw_call(ExprType::Floor)),
170 ("trunc", raw_call(ExprType::Trunc)),
171 ("abs", raw_call(ExprType::Abs)),
172 ("exp", raw_call(ExprType::Exp)),
173 ("ln", raw_call(ExprType::Ln)),
174 ("log", raw_call(ExprType::Log10)),
175 ("log10", raw_call(ExprType::Log10)),
176 ("mod", raw_call(ExprType::Modulus)),
177 ("sin", raw_call(ExprType::Sin)),
178 ("cos", raw_call(ExprType::Cos)),
179 ("tan", raw_call(ExprType::Tan)),
180 ("cot", raw_call(ExprType::Cot)),
181 ("asin", raw_call(ExprType::Asin)),
182 ("acos", raw_call(ExprType::Acos)),
183 ("atan", raw_call(ExprType::Atan)),
184 ("atan2", raw_call(ExprType::Atan2)),
185 ("sind", raw_call(ExprType::Sind)),
186 ("cosd", raw_call(ExprType::Cosd)),
187 ("cotd", raw_call(ExprType::Cotd)),
188 ("tand", raw_call(ExprType::Tand)),
189 ("sinh", raw_call(ExprType::Sinh)),
190 ("cosh", raw_call(ExprType::Cosh)),
191 ("tanh", raw_call(ExprType::Tanh)),
192 ("coth", raw_call(ExprType::Coth)),
193 ("asinh", raw_call(ExprType::Asinh)),
194 ("acosh", raw_call(ExprType::Acosh)),
195 ("atanh", raw_call(ExprType::Atanh)),
196 ("asind", raw_call(ExprType::Asind)),
197 ("acosd", raw_call(ExprType::Acosd)),
198 ("atand", raw_call(ExprType::Atand)),
199 ("atan2d", raw_call(ExprType::Atan2d)),
200 ("degrees", raw_call(ExprType::Degrees)),
201 ("radians", raw_call(ExprType::Radians)),
202 ("sqrt", raw_call(ExprType::Sqrt)),
203 ("cbrt", raw_call(ExprType::Cbrt)),
204 ("sign", raw_call(ExprType::Sign)),
205 ("scale", raw_call(ExprType::Scale)),
206 ("min_scale", raw_call(ExprType::MinScale)),
207 ("trim_scale", raw_call(ExprType::TrimScale)),
208 ("gamma", raw_call(ExprType::Gamma)),
209 ("lgamma", raw_call(ExprType::Lgamma)),
210 (
212 "to_timestamp",
213 dispatch_by_len(vec![
214 (1, raw_call(ExprType::SecToTimestamptz)),
215 (2, raw_call(ExprType::CharToTimestamptz)),
216 ]),
217 ),
218 ("date_trunc", raw_call(ExprType::DateTrunc)),
219 ("date_bin", raw_call(ExprType::DateBin)),
220 ("date_part", raw_call(ExprType::DatePart)),
221 ("make_date", raw_call(ExprType::MakeDate)),
222 ("make_time", raw_call(ExprType::MakeTime)),
223 ("make_timestamp", raw_call(ExprType::MakeTimestamp)),
224 ("make_timestamptz", raw_call(ExprType::MakeTimestamptz)),
225 ("timezone", guard_by_len(|_binder, [arg0, arg1]| {
226 Ok(FunctionCall::new(ExprType::AtTimeZone, vec![arg1, arg0])?.into())
228 })),
229 ("to_date", raw_call(ExprType::CharToDate)),
230 ("substr", raw_call(ExprType::Substr)),
232 ("length", raw_call(ExprType::Length)),
233 ("upper", raw_call(ExprType::Upper)),
234 ("lower", raw_call(ExprType::Lower)),
235 ("trim", raw_call(ExprType::Trim)),
236 ("replace", raw_call(ExprType::Replace)),
237 ("overlay", raw_call(ExprType::Overlay)),
238 ("btrim", raw_call(ExprType::Trim)),
239 ("ltrim", raw_call(ExprType::Ltrim)),
240 ("rtrim", raw_call(ExprType::Rtrim)),
241 ("md5", raw_call(ExprType::Md5)),
242 ("to_char", raw_call(ExprType::ToChar)),
243 (
244 "concat",
245 rewrite(ExprType::ConcatWs, rewrite_concat_to_concat_ws),
246 ),
247 ("concat_ws", raw_call(ExprType::ConcatWs)),
248 ("format", raw_call(ExprType::Format)),
249 ("translate", raw_call(ExprType::Translate)),
250 ("split_part", raw_call(ExprType::SplitPart)),
251 ("char_length", raw_call(ExprType::CharLength)),
252 ("character_length", raw_call(ExprType::CharLength)),
253 ("repeat", raw_call(ExprType::Repeat)),
254 ("ascii", raw_call(ExprType::Ascii)),
255 ("octet_length", raw_call(ExprType::OctetLength)),
256 ("bit_length", raw_call(ExprType::BitLength)),
257 ("regexp_match", raw_call(ExprType::RegexpMatch)),
258 ("regexp_replace", raw_call(ExprType::RegexpReplace)),
259 ("regexp_count", raw_call(ExprType::RegexpCount)),
260 ("regexp_split_to_array", raw_call(ExprType::RegexpSplitToArray)),
261 ("chr", raw_call(ExprType::Chr)),
262 ("starts_with", raw_call(ExprType::StartsWith)),
263 ("initcap", raw_call(ExprType::Initcap)),
264 ("lpad", raw_call(ExprType::Lpad)),
265 ("rpad", raw_call(ExprType::Rpad)),
266 ("reverse", raw_call(ExprType::Reverse)),
267 ("strpos", raw_call(ExprType::Position)),
268 ("to_ascii", raw_call(ExprType::ToAscii)),
269 ("to_hex", raw_call(ExprType::ToHex)),
270 ("quote_ident", raw_call(ExprType::QuoteIdent)),
271 ("quote_literal", guard_by_len(|_binder, [mut input]| {
272 if input.return_type() != DataType::Varchar {
273 FunctionCall::cast_mut(&mut input, &DataType::Varchar, CastContext::Explicit)?;
276 }
277 Ok(FunctionCall::new_unchecked(ExprType::QuoteLiteral, vec![input], DataType::Varchar).into())
278 })),
279 ("quote_nullable", guard_by_len(|_binder, [mut input]| {
280 if input.return_type() != DataType::Varchar {
281 FunctionCall::cast_mut(&mut input, &DataType::Varchar, CastContext::Explicit)?;
284 }
285 Ok(FunctionCall::new_unchecked(ExprType::QuoteNullable, vec![input], DataType::Varchar).into())
286 })),
287 ("string_to_array", raw_call(ExprType::StringToArray)),
288 ("get_bit", raw_call(ExprType::GetBit)),
289 ("get_byte", raw_call(ExprType::GetByte)),
290 ("set_bit", raw_call(ExprType::SetBit)),
291 ("set_byte", raw_call(ExprType::SetByte)),
292 ("bit_count", raw_call(ExprType::BitCount)),
293 ("encode", raw_call(ExprType::Encode)),
294 ("decode", raw_call(ExprType::Decode)),
295 ("convert_from", raw_call(ExprType::ConvertFrom)),
296 ("convert_to", raw_call(ExprType::ConvertTo)),
297 ("sha1", raw_call(ExprType::Sha1)),
298 ("sha224", raw_call(ExprType::Sha224)),
299 ("sha256", raw_call(ExprType::Sha256)),
300 ("sha384", raw_call(ExprType::Sha384)),
301 ("sha512", raw_call(ExprType::Sha512)),
302 ("encrypt", raw_call(ExprType::Encrypt)),
303 ("decrypt", raw_call(ExprType::Decrypt)),
304 ("hmac", raw_call(ExprType::Hmac)),
305 ("crc32", raw_call(ExprType::Crc32)),
306 ("crc32c", raw_call(ExprType::Crc32c)),
307 ("secure_compare", raw_call(ExprType::SecureCompare)),
308 ("left", raw_call(ExprType::Left)),
309 ("right", raw_call(ExprType::Right)),
310 ("inet_aton", raw_call(ExprType::InetAton)),
311 ("inet_ntoa", raw_call(ExprType::InetNtoa)),
312 ("int8send", raw_call(ExprType::PgwireSend)),
313 ("int8recv", guard_by_len(|_binder, [mut input]| {
314 let hint = if !input.is_untyped() && input.return_type() == DataType::Varchar {
316 " Consider `decode` or cast."
317 } else {
318 ""
319 };
320 input.cast_implicit_mut(&DataType::Bytea).map_err(|e| {
321 ErrorCode::BindError(format!("{} in `recv`.{hint}", e.as_report()))
322 })?;
323 Ok(FunctionCall::new_unchecked(ExprType::PgwireRecv, vec![input], DataType::Int64).into())
324 })),
325 ("array_cat", raw_call(ExprType::ArrayCat)),
327 ("array_append", raw_call(ExprType::ArrayAppend)),
328 ("array_join", raw_call(ExprType::ArrayToString)),
329 ("array_prepend", raw_call(ExprType::ArrayPrepend)),
330 ("array_to_string", raw_call(ExprType::ArrayToString)),
331 ("array_distinct", raw_call(ExprType::ArrayDistinct)),
332 ("array_min", raw_call(ExprType::ArrayMin)),
333 ("array_sort", raw_call(ExprType::ArraySort)),
334 ("array_length", raw_call(ExprType::ArrayLength)),
335 ("cardinality", raw_call(ExprType::Cardinality)),
336 ("array_remove", raw_call(ExprType::ArrayRemove)),
337 ("array_replace", raw_call(ExprType::ArrayReplace)),
338 ("array_reverse", raw_call(ExprType::ArrayReverse)),
339 ("array_max", raw_call(ExprType::ArrayMax)),
340 ("array_sum", raw_call(ExprType::ArraySum)),
341 ("array_position", raw_call(ExprType::ArrayPosition)),
342 ("array_positions", raw_call(ExprType::ArrayPositions)),
343 ("array_contains", raw_call(ExprType::ArrayContains)),
344 ("arraycontains", raw_call(ExprType::ArrayContains)),
345 ("array_contained", raw_call(ExprType::ArrayContained)),
346 ("arraycontained", raw_call(ExprType::ArrayContained)),
347 ("array_flatten", guard_by_len(|_binder, [input]| {
348 input.ensure_array_type().map_err(|_| ErrorCode::BindError("array_flatten expects `any[][]` input".into()))?;
349 let return_type = input.return_type().into_list_elem();
350 if !return_type.is_array() {
351 return Err(ErrorCode::BindError("array_flatten expects `any[][]` input".into()).into());
352 }
353 Ok(FunctionCall::new_unchecked(ExprType::ArrayFlatten, vec![input], return_type).into())
354 })),
355 ("trim_array", raw_call(ExprType::TrimArray)),
356 (
357 "array_ndims",
358 guard_by_len(|_binder, [input]| {
359 input.ensure_array_type()?;
360
361 let n = input.return_type().array_ndims()
362 .try_into().map_err(|_| ErrorCode::BindError("array_ndims integer overflow".into()))?;
363 Ok(ExprImpl::literal_int(n))
364 }),
365 ),
366 (
367 "array_lower",
368 guard_by_len(|binder, [arg0, arg1]| {
369 let ndims_expr = binder.bind_builtin_scalar_function("array_ndims", vec![arg0], false)?;
371 let arg1 = arg1.cast_implicit(&DataType::Int32)?;
372
373 FunctionCall::new(
374 ExprType::Case,
375 vec![
376 FunctionCall::new(
377 ExprType::And,
378 vec![
379 FunctionCall::new(ExprType::LessThan, vec![ExprImpl::literal_int(0), arg1.clone()])?.into(),
380 FunctionCall::new(ExprType::LessThanOrEqual, vec![arg1, ndims_expr])?.into(),
381 ],
382 )?.into(),
383 ExprImpl::literal_int(1),
384 ],
385 ).map(Into::into)
386 }),
387 ),
388 ("array_upper", raw_call(ExprType::ArrayLength)), ("array_dims", raw_call(ExprType::ArrayDims)),
390 ("hex_to_int256", raw_call(ExprType::HexToInt256)),
392 ("jsonb_object_field", raw_call(ExprType::JsonbAccess)),
394 ("jsonb_array_element", raw_call(ExprType::JsonbAccess)),
395 ("jsonb_object_field_text", raw_call(ExprType::JsonbAccessStr)),
396 ("jsonb_array_element_text", raw_call(ExprType::JsonbAccessStr)),
397 ("jsonb_extract_path", raw_call(ExprType::JsonbExtractPath)),
398 ("jsonb_extract_path_text", raw_call(ExprType::JsonbExtractPathText)),
399 ("jsonb_typeof", raw_call(ExprType::JsonbTypeof)),
400 ("jsonb_array_length", raw_call(ExprType::JsonbArrayLength)),
401 ("jsonb_concat", raw_call(ExprType::JsonbConcat)),
402 ("jsonb_object", raw_call(ExprType::JsonbObject)),
403 ("jsonb_pretty", raw_call(ExprType::JsonbPretty)),
404 ("jsonb_contains", raw_call(ExprType::JsonbContains)),
405 ("jsonb_contained", raw_call(ExprType::JsonbContained)),
406 ("jsonb_exists", raw_call(ExprType::JsonbExists)),
407 ("jsonb_exists_any", raw_call(ExprType::JsonbExistsAny)),
408 ("jsonb_exists_all", raw_call(ExprType::JsonbExistsAll)),
409 ("jsonb_delete", raw_call(ExprType::Subtract)),
410 ("jsonb_delete_path", raw_call(ExprType::JsonbDeletePath)),
411 ("jsonb_strip_nulls", raw_call(ExprType::JsonbStripNulls)),
412 ("to_jsonb", raw_call(ExprType::ToJsonb)),
413 ("jsonb_build_array", raw_call(ExprType::JsonbBuildArray)),
414 ("jsonb_build_object", raw_call(ExprType::JsonbBuildObject)),
415 ("jsonb_populate_record", raw_call(ExprType::JsonbPopulateRecord)),
416 ("jsonb_path_match", raw_call(ExprType::JsonbPathMatch)),
417 ("jsonb_path_exists", raw_call(ExprType::JsonbPathExists)),
418 ("jsonb_path_query_array", raw_call(ExprType::JsonbPathQueryArray)),
419 ("jsonb_path_query_first", raw_call(ExprType::JsonbPathQueryFirst)),
420 ("jsonb_set", raw_call(ExprType::JsonbSet)),
421 ("jsonb_populate_map", raw_call(ExprType::JsonbPopulateMap)),
422 ("jsonb_to_array", raw_call(ExprType::JsonbToArray)),
423 ("map_from_entries", raw_call(ExprType::MapFromEntries)),
425 ("map_access", raw_call(ExprType::MapAccess)),
426 ("map_keys", raw_call(ExprType::MapKeys)),
427 ("map_values", raw_call(ExprType::MapValues)),
428 ("map_entries", raw_call(ExprType::MapEntries)),
429 ("map_from_key_values", raw_call(ExprType::MapFromKeyValues)),
430 ("map_cat", raw_call(ExprType::MapCat)),
431 ("map_contains", raw_call(ExprType::MapContains)),
432 ("map_delete", raw_call(ExprType::MapDelete)),
433 ("map_insert", raw_call(ExprType::MapInsert)),
434 ("map_length", raw_call(ExprType::MapLength)),
435 ("l2_distance", raw_call(ExprType::L2Distance)),
437 ("cosine_distance", raw_call(ExprType::CosineDistance)),
438 ("l1_distance", raw_call(ExprType::L1Distance)),
439 ("inner_product", raw_call(ExprType::InnerProduct)),
440 ("vector_norm", raw_call(ExprType::L2Norm)),
441 ("l2_normalize", raw_call(ExprType::L2Normalize)),
442 ("subvector", guard_by_len(|_, [vector_expr, start_expr, len_expr]| {
443 let dimensions = if let DataType::Vector(length) = vector_expr.return_type() {
444 length as i32
445 } else {
446 return Err(ErrorCode::BindError("subvector expects `vector(dim)` input".into()).into());
447 };
448 let start = start_expr
449 .try_fold_const()
450 .transpose()?
451 .and_then(|datum| match datum {
452 Some(ScalarImpl::Int32(v)) => Some(v),
453 _ => None,
454 })
455 .ok_or_else(|| ErrorCode::ExprError("`start` must be an Int32 constant".into()))?;
456
457 let len = len_expr
458 .try_fold_const()
459 .transpose()?
460 .and_then(|datum| match datum {
461 Some(ScalarImpl::Int32(v)) => Some(v),
462 _ => None,
463 })
464 .ok_or_else(|| ErrorCode::ExprError("`count` must be an Int32 constant".into()))?;
465 if len < 1 || len > DataType::VEC_MAX_SIZE as i32 {
466 return Err(ErrorCode::InvalidParameterValue(format!("Invalid vector size: expected 1..={}, got {}", DataType::VEC_MAX_SIZE, len)).into());
467 }
468
469 let end = start + len - 1;
470
471 if start < 1 || end > dimensions {
472 return Err(ErrorCode::InvalidParameterValue(format!(
473 "vector slice range out of bounds: start={}, end={}, valid range is [1, {}]",
474 start,
475 end,
476 dimensions
477 )).into());
478 }
479
480 Ok(FunctionCall::new_unchecked(ExprType::Subvector, vec![vector_expr, start_expr, len_expr], DataType::Vector(len as usize)).into())
481 })),
482 ("pi", pi()),
484 ("greatest", raw_call(ExprType::Greatest)),
486 ("least", raw_call(ExprType::Least)),
487 (
489 "pg_typeof",
490 guard_by_len(|_binder, [input]| {
491 let v = match input.is_untyped() {
492 true => "unknown".into(),
493 false => input.return_type().to_string(),
494 };
495 Ok(ExprImpl::literal_varchar(v))
496 }),
497 ),
498 ("current_catalog", current_database()),
499 ("current_database", current_database()),
500 ("current_schema", guard_by_len(|binder, []| {
501 Ok(binder
502 .first_valid_schema()
503 .map(|schema| ExprImpl::literal_varchar(schema.name()))
504 .unwrap_or_else(|_| ExprImpl::literal_null(DataType::Varchar)))
505 })),
506 ("current_schemas", raw(|binder, mut inputs| {
507 let no_match_err = ErrorCode::ExprError(
508 "No function matches the given name and argument types. You might need to add explicit type casts.".into()
509 );
510 if inputs.len() != 1 {
511 return Err(no_match_err.into());
512 }
513 let input = inputs
514 .pop()
515 .unwrap()
516 .enforce_bool_clause("current_schemas")
517 .map_err(|_| no_match_err)?;
518
519 let ExprImpl::Literal(literal) = &input else {
520 bail_not_implemented!("Only boolean literals are supported in `current_schemas`.");
521 };
522
523 let Some(bool) = literal.get_data().as_ref().map(|bool| bool.clone().into_bool()) else {
524 return Ok(ExprImpl::literal_null(DataType::Varchar.list()));
525 };
526
527 let paths = if bool {
528 binder.search_path.path()
529 } else {
530 binder.search_path.real_path()
531 };
532
533 let mut schema_names = vec![];
534 for path in paths {
535 let mut schema_name = path;
536 if schema_name == USER_NAME_WILD_CARD {
537 schema_name = &binder.auth_context.user_name;
538 }
539
540 if binder
541 .catalog
542 .get_schema_by_name(&binder.db_name, schema_name)
543 .is_ok()
544 {
545 schema_names.push(schema_name.as_str());
546 }
547 }
548
549 Ok(ExprImpl::literal_list(
550 ListValue::from_iter(schema_names),
551 DataType::Varchar,
552 ))
553 })),
554 ("session_user", session_user()),
555 ("current_role", current_user()),
556 ("current_user", current_user()),
557 ("user", current_user()),
558 ("pg_get_userbyid", raw_call(ExprType::PgGetUserbyid)),
559 ("pg_get_indexdef", raw_call(ExprType::PgGetIndexdef)),
560 ("pg_get_viewdef", raw_call(ExprType::PgGetViewdef)),
561 ("pg_index_column_has_property", raw_call(ExprType::PgIndexColumnHasProperty)),
562 ("pg_relation_size", raw(|_binder, mut inputs| {
563 if inputs.is_empty() {
564 return Err(ErrorCode::ExprError(
565 "function pg_relation_size() does not exist".into(),
566 )
567 .into());
568 }
569 inputs[0].cast_to_regclass_mut()?;
570 Ok(FunctionCall::new(ExprType::PgRelationSize, inputs)?.into())
571 })),
572 ("pg_get_serial_sequence", raw_literal(ExprImpl::literal_null(DataType::Varchar))),
573 ("pg_table_size", guard_by_len(|_binder, [mut input]| {
574 input.cast_to_regclass_mut()?;
575 Ok(FunctionCall::new(ExprType::PgRelationSize, vec![input])?.into())
576 })),
577 ("pg_indexes_size", guard_by_len(|_binder, [mut input]| {
578 input.cast_to_regclass_mut()?;
579 Ok(FunctionCall::new(ExprType::PgIndexesSize, vec![input])?.into())
580 })),
581 ("pg_get_expr", raw(|_binder, inputs| {
582 if inputs.len() == 2 || inputs.len() == 3 {
583 Ok(ExprImpl::literal_varchar("".into()))
585 } else {
586 Err(ErrorCode::ExprError(
587 "Too many/few arguments for pg_catalog.pg_get_expr()".into(),
588 )
589 .into())
590 }
591 })),
592 ("pg_my_temp_schema", guard_by_len(|_binder, []| {
593 Ok(ExprImpl::literal_int(
595 0,
597 ))
598 })),
599 ("current_setting", guard_by_len(|binder, [input]| {
600 let input = if let ExprImpl::Literal(literal) = &input &&
601 let Some(ScalarImpl::Utf8(input)) = literal.get_data()
602 {
603 input
604 } else {
605 return Err(ErrorCode::ExprError(
606 "Only literal is supported in `setting_name`.".into(),
607 )
608 .into());
609 };
610 let session_config = binder.session_config.read();
611 Ok(ExprImpl::literal_varchar(session_config.get(input.as_ref())?))
612 })),
613 ("set_config", guard_by_len(|binder, [arg0, arg1, arg2]| {
614 let setting_name = if let ExprImpl::Literal(literal) = &arg0 && let Some(ScalarImpl::Utf8(input)) = literal.get_data() {
615 input
616 } else {
617 return Err(ErrorCode::ExprError(
618 "Only string literal is supported in `setting_name`.".into(),
619 )
620 .into());
621 };
622
623 let new_value = if let ExprImpl::Literal(literal) = &arg1 && let Some(ScalarImpl::Utf8(input)) = literal.get_data() {
624 input
625 } else {
626 return Err(ErrorCode::ExprError(
627 "Only string literal is supported in `setting_name`.".into(),
628 )
629 .into());
630 };
631
632 let is_local = if let ExprImpl::Literal(literal) = &arg2 && let Some(ScalarImpl::Bool(input)) = literal.get_data() {
633 input
634 } else {
635 return Err(ErrorCode::ExprError(
636 "Only bool literal is supported in `is_local`.".into(),
637 )
638 .into());
639 };
640
641 if *is_local {
642 return Err(ErrorCode::ExprError(
643 "`is_local = true` is not supported now.".into(),
644 )
645 .into());
646 }
647
648 let mut session_config = binder.session_config.write();
649
650 session_config.set(setting_name, new_value.to_string(), &mut ())?;
652
653 Ok(ExprImpl::literal_varchar(new_value.to_string()))
654 })),
655 ("format_type", raw_call(ExprType::FormatType)),
656 ("pg_table_is_visible", raw_call(ExprType::PgTableIsVisible)),
657 ("pg_type_is_visible", raw_literal(ExprImpl::literal_bool(true))),
658 ("pg_get_constraintdef", raw_literal(ExprImpl::literal_null(DataType::Varchar))),
659 ("pg_get_partkeydef", raw_literal(ExprImpl::literal_null(DataType::Varchar))),
660 ("pg_encoding_to_char", raw_literal(ExprImpl::literal_varchar("UTF8".into()))),
661 ("has_database_privilege", raw(|binder, mut inputs| {
662 if inputs.len() == 2 {
663 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
664 }
665 if inputs.len() == 3 {
666 Ok(FunctionCall::new(ExprType::HasDatabasePrivilege, inputs)?.into())
667 } else {
668 Err(ErrorCode::ExprError(
669 "Too many/few arguments for pg_catalog.has_database_privilege()".into(),
670 )
671 .into())
672 }
673 })),
674 ("has_table_privilege", raw(|binder, mut inputs| {
675 if inputs.len() == 2 {
676 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
677 }
678 if inputs.len() == 3 {
679 if inputs[1].return_type() == DataType::Varchar {
680 inputs[1].cast_to_regclass_mut()?;
681 }
682 Ok(FunctionCall::new(ExprType::HasTablePrivilege, inputs)?.into())
683 } else {
684 Err(ErrorCode::ExprError(
685 "Too many/few arguments for pg_catalog.has_table_privilege()".into(),
686 )
687 .into())
688 }
689 })),
690 ("has_any_column_privilege", raw(|binder, mut inputs| {
691 if inputs.len() == 2 {
692 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
693 }
694 if inputs.len() == 3 {
695 if inputs[1].return_type() == DataType::Varchar {
696 inputs[1].cast_to_regclass_mut()?;
697 }
698 Ok(FunctionCall::new(ExprType::HasAnyColumnPrivilege, inputs)?.into())
699 } else {
700 Err(ErrorCode::ExprError(
701 "Too many/few arguments for pg_catalog.has_any_column_privilege()".into(),
702 )
703 .into())
704 }
705 })),
706 ("has_schema_privilege", raw(|binder, mut inputs| {
707 if inputs.len() == 2 {
708 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
709 }
710 if inputs.len() == 3 {
711 Ok(FunctionCall::new(ExprType::HasSchemaPrivilege, inputs)?.into())
712 } else {
713 Err(ErrorCode::ExprError(
714 "Too many/few arguments for pg_catalog.has_schema_privilege()".into(),
715 )
716 .into())
717 }
718 })),
719 ("has_function_privilege", raw(|binder, mut inputs| {
720 if inputs.len() == 2 {
721 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
722 }
723 if inputs.len() == 3 {
724 Ok(FunctionCall::new(ExprType::HasFunctionPrivilege, inputs)?.into())
725 } else {
726 Err(ErrorCode::ExprError(
727 "Too many/few arguments for pg_catalog.has_function_privilege()".into(),
728 )
729 .into())
730 }
731 })),
732 ("pg_stat_get_numscans", raw_literal(ExprImpl::literal_bigint(0))),
733 ("pg_backend_pid", raw(|binder, _inputs| {
734 Ok(ExprImpl::literal_int(binder.session_id.0))
736 })),
737 ("pg_cancel_backend", guard_by_len(|_binder, [_input]| {
738 Ok(ExprImpl::literal_bool(false))
740 })),
741 ("pg_terminate_backend", guard_by_len(|_binder, [_input]| {
742 Ok(ExprImpl::literal_bool(false))
745 })),
746 ("pg_tablespace_location", guard_by_len(|_binder, [_input]| {
747 Ok(ExprImpl::literal_null(DataType::Varchar))
748 })),
749 ("pg_postmaster_start_time", guard_by_len(|_binder, []| {
750 let server_start_time = risingwave_variables::get_server_start_time();
751 let datum = server_start_time.map(Timestamptz::from).map(ScalarImpl::from);
752 let literal = Literal::new(datum, DataType::Timestamptz);
753 Ok(literal.into())
754 })),
755 ("col_description", raw_call(ExprType::ColDescription)),
759 ("obj_description", raw_literal(ExprImpl::literal_varchar("".to_owned()))),
760 ("shobj_description", raw_literal(ExprImpl::literal_varchar("".to_owned()))),
761 ("pg_is_in_recovery", raw_call(ExprType::PgIsInRecovery)),
762 ("rw_recovery_status", raw_call(ExprType::RwRecoveryStatus)),
763 ("rw_cluster_id", raw_call(ExprType::RwClusterId)),
764 ("rw_epoch_to_ts", raw_call(ExprType::RwEpochToTs)),
765 ("rw_fragment_vnodes", raw_call(ExprType::RwFragmentVnodes)),
766 ("rw_actor_vnodes", raw_call(ExprType::RwActorVnodes)),
767 ("rw_vnode", raw_call(ExprType::VnodeUser)),
769 ("rw_license", raw_call(ExprType::License)),
770 ("rw_test_paid_tier", raw_call(ExprType::TestFeature)), ("rw_test_feature", raw_call(ExprType::TestFeature)), ("version", raw_literal(ExprImpl::literal_varchar(current_cluster_version()))),
774 ("now", now()),
776 ("current_timestamp", now()),
777 ("proctime", proctime()),
778 ("pg_sleep", raw_call(ExprType::PgSleep)),
779 ("pg_sleep_for", raw_call(ExprType::PgSleepFor)),
780 ("random", raw_call(ExprType::Random)),
781 ("date", guard_by_len(|_binder, [input]| {
787 input.cast_explicit(&DataType::Date).map_err(Into::into)
788 })),
789
790 ("openai_embedding", guard_by_len(|_binder, [arg0, arg1]| {
792 if let ExprImpl::Literal(config) = &arg0 && let Some(ScalarImpl::Jsonb(_config)) = config.get_data() {
794 Ok(FunctionCall::new(ExprType::OpenaiEmbedding, vec![arg0, arg1])?.into())
795 } else {
796 Err(ErrorCode::InvalidInputSyntax(
797 "`embedding_config` must be constant jsonb".to_owned(),
798 ).into())
799 }
800 })),
801 ]
802 .into_iter()
803 .collect()
804 });
805
806 static FUNCTIONS_BKTREE: LazyLock<BKTree<&str>> = LazyLock::new(|| {
807 let mut tree = BKTree::new(metrics::Levenshtein);
808
809 for k in HANDLES.keys() {
811 tree.add(*k);
812 }
813
814 tree
815 });
816
817 if variadic {
818 let func = match function_name {
819 "format" => ExprType::FormatVariadic,
820 "concat" => ExprType::ConcatVariadic,
821 "concat_ws" => ExprType::ConcatWsVariadic,
822 "jsonb_build_array" => ExprType::JsonbBuildArrayVariadic,
823 "jsonb_build_object" => ExprType::JsonbBuildObjectVariadic,
824 "jsonb_extract_path" => ExprType::JsonbExtractPathVariadic,
825 "jsonb_extract_path_text" => ExprType::JsonbExtractPathTextVariadic,
826 _ => {
827 return Err(ErrorCode::BindError(format!(
828 "VARIADIC argument is not allowed in function \"{}\"",
829 function_name
830 ))
831 .into());
832 }
833 };
834 return Ok(FunctionCall::new(func, inputs)?.into());
835 }
836
837 match HANDLES.get(function_name) {
839 Some(handle) => handle(self, inputs),
840 None => {
841 let allowed_distance = if function_name.len() > 3 { 2 } else { 1 };
842
843 let candidates = FUNCTIONS_BKTREE
844 .find(function_name, allowed_distance)
845 .map(|(_idx, c)| c)
846 .join(" or ");
847
848 Err(no_function!(
849 candidates = (!candidates.is_empty()).then_some(candidates),
850 "{}({})",
851 function_name,
852 inputs.iter().map(|e| e.return_type()).join(", ")
853 )
854 .into())
855 }
856 }
857 }
858
859 fn ensure_now_function_allowed(&self) -> Result<()> {
860 if self.is_for_stream()
861 && !matches!(
862 self.context.clause,
863 Some(Clause::Where)
864 | Some(Clause::Having)
865 | Some(Clause::JoinOn)
866 | Some(Clause::From)
867 )
868 {
869 return Err(ErrorCode::InvalidInputSyntax(format!(
870 "For streaming queries, `NOW()` function is only allowed in `WHERE`, `HAVING`, `ON` and `FROM`. Found in clause: {:?}. \
871 Please refer to https://docs.risingwave.com/processing/sql/temporal-filters for more information",
872 self.context.clause
873 ))
874 .into());
875 }
876 if matches!(self.context.clause, Some(Clause::GeneratedColumn)) {
877 return Err(ErrorCode::InvalidInputSyntax(
878 "Cannot use `NOW()` function in generated columns. Do you want `PROCTIME()`?"
879 .to_owned(),
880 )
881 .into());
882 }
883 Ok(())
884 }
885
886 fn ensure_proctime_function_allowed(&self) -> Result<()> {
887 if !self.is_for_ddl() {
888 return Err(ErrorCode::InvalidInputSyntax(
889 "Function `PROCTIME()` is only allowed in CREATE TABLE/SOURCE. Is `NOW()` what you want?".to_owned(),
890 )
891 .into());
892 }
893 Ok(())
894 }
895}
896
897fn rewrite_concat_to_concat_ws(inputs: Vec<ExprImpl>) -> Result<Vec<ExprImpl>> {
898 if inputs.is_empty() {
899 Err(ErrorCode::BindError(
900 "Function `concat` takes at least 1 arguments (0 given)".to_owned(),
901 )
902 .into())
903 } else {
904 let inputs = std::iter::once(ExprImpl::literal_varchar("".to_owned()))
905 .chain(inputs)
906 .collect();
907 Ok(inputs)
908 }
909}
910
911fn rewrite_nullif_to_case_when(inputs: Vec<ExprImpl>) -> Result<Vec<ExprImpl>> {
914 if inputs.len() != 2 {
915 Err(ErrorCode::BindError("Function `nullif` must contain 2 arguments".to_owned()).into())
916 } else {
917 let inputs = vec![
918 FunctionCall::new(ExprType::Equal, inputs.clone())?.into(),
919 Literal::new(None, inputs[0].return_type()).into(),
920 inputs[0].clone(),
921 ];
922 Ok(inputs)
923 }
924}
925
926fn rewrite_two_bool_inputs(mut inputs: Vec<ExprImpl>) -> Result<Vec<ExprImpl>> {
927 if inputs.len() != 2 {
928 return Err(
929 ErrorCode::BindError("function must contain only 2 arguments".to_owned()).into(),
930 );
931 }
932 let left = inputs.pop().unwrap();
933 let right = inputs.pop().unwrap();
934 Ok(vec![
935 left.cast_implicit(&DataType::Boolean)?,
936 right.cast_implicit(&DataType::Boolean)?,
937 ])
938}