1use std::collections::HashMap;
16use std::sync::LazyLock;
17
18use bk_tree::{BKTree, metrics};
19use itertools::Itertools;
20use risingwave_common::session_config::USER_NAME_WILD_CARD;
21use risingwave_common::types::{DataType, ListValue, ScalarImpl, Timestamptz};
22use risingwave_common::{bail_not_implemented, current_cluster_version, no_function};
23use thiserror_ext::AsReport;
24
25use crate::Binder;
26use crate::binder::Clause;
27use crate::error::{ErrorCode, Result};
28use crate::expr::{CastContext, Expr, ExprImpl, ExprType, FunctionCall, Literal, Now};
29
30impl Binder {
31 pub(super) fn bind_builtin_scalar_function(
32 &mut self,
33 function_name: &str,
34 inputs: Vec<ExprImpl>,
35 variadic: bool,
36 ) -> Result<ExprImpl> {
37 type Inputs = Vec<ExprImpl>;
38
39 type Handle = Box<dyn Fn(&mut Binder, Inputs) -> Result<ExprImpl> + Sync + Send>;
40
41 fn rewrite(r#type: ExprType, rewriter: fn(Inputs) -> Result<Inputs>) -> Handle {
42 Box::new(move |_binder, mut inputs| {
43 inputs = (rewriter)(inputs)?;
44 Ok(FunctionCall::new(r#type, inputs)?.into())
45 })
46 }
47
48 fn raw_call(r#type: ExprType) -> Handle {
49 rewrite(r#type, Ok)
50 }
51
52 fn guard_by_len<const E: usize>(
53 handle: impl Fn(&mut Binder, [ExprImpl; E]) -> Result<ExprImpl> + Sync + Send + 'static,
54 ) -> Handle {
55 Box::new(move |binder, inputs| {
56 let input_len = inputs.len();
57 let Ok(inputs) = inputs.try_into() else {
58 return Err(ErrorCode::ExprError(
59 format!("unexpected arguments number {}, expect {}", input_len, E).into(),
60 )
61 .into());
62 };
63 handle(binder, inputs)
64 })
65 }
66
67 fn raw<F: Fn(&mut Binder, Inputs) -> Result<ExprImpl> + Sync + Send + 'static>(
68 f: F,
69 ) -> Handle {
70 Box::new(f)
71 }
72
73 fn dispatch_by_len(mapping: Vec<(usize, Handle)>) -> Handle {
74 Box::new(move |binder, inputs| {
75 for (len, handle) in &mapping {
76 if inputs.len() == *len {
77 return handle(binder, inputs);
78 }
79 }
80 Err(ErrorCode::ExprError("unexpected arguments number".into()).into())
81 })
82 }
83
84 fn raw_literal(literal: ExprImpl) -> Handle {
85 Box::new(move |_binder, _inputs| Ok(literal.clone()))
86 }
87
88 fn now() -> Handle {
89 guard_by_len(move |binder, []| {
90 binder.ensure_now_function_allowed()?;
91 Ok(Now.into())
94 })
95 }
96
97 fn pi() -> Handle {
98 raw_literal(ExprImpl::literal_f64(std::f64::consts::PI))
99 }
100
101 fn proctime() -> Handle {
102 Box::new(move |binder, inputs| {
103 binder.ensure_proctime_function_allowed()?;
104 raw_call(ExprType::Proctime)(binder, inputs)
105 })
106 }
107
108 fn session_user() -> Handle {
110 guard_by_len(|binder, []| {
111 Ok(ExprImpl::literal_varchar(
112 binder.auth_context.user_name.clone(),
113 ))
114 })
115 }
116
117 fn current_user() -> Handle {
121 guard_by_len(|binder, []| {
122 Ok(ExprImpl::literal_varchar(
123 binder.auth_context.user_name.clone(),
124 ))
125 })
126 }
127
128 fn current_database() -> Handle {
131 guard_by_len(|binder, []| Ok(ExprImpl::literal_varchar(binder.db_name.clone())))
132 }
133
134 static HANDLES: LazyLock<HashMap<&'static str, Handle>> = LazyLock::new(|| {
138 [
139 (
140 "booleq",
141 rewrite(ExprType::Equal, rewrite_two_bool_inputs),
142 ),
143 (
144 "boolne",
145 rewrite(ExprType::NotEqual, rewrite_two_bool_inputs),
146 ),
147 ("coalesce", rewrite(ExprType::Coalesce, |inputs| {
148 if inputs.iter().any(ExprImpl::has_table_function) {
149 return Err(ErrorCode::BindError("table functions are not allowed in COALESCE".into()).into());
150 }
151 Ok(inputs)
152 })),
153 (
154 "nullif",
155 rewrite(ExprType::Case, rewrite_nullif_to_case_when),
156 ),
157 (
158 "round",
159 dispatch_by_len(vec![
160 (2, raw_call(ExprType::RoundDigit)),
161 (1, raw_call(ExprType::Round)),
162 ]),
163 ),
164 ("pow", raw_call(ExprType::Pow)),
165 ("power", raw_call(ExprType::Pow)),
167 ("ceil", raw_call(ExprType::Ceil)),
168 ("ceiling", raw_call(ExprType::Ceil)),
169 ("floor", raw_call(ExprType::Floor)),
170 ("trunc", raw_call(ExprType::Trunc)),
171 ("abs", raw_call(ExprType::Abs)),
172 ("exp", raw_call(ExprType::Exp)),
173 ("ln", raw_call(ExprType::Ln)),
174 ("log", raw_call(ExprType::Log10)),
175 ("log10", raw_call(ExprType::Log10)),
176 ("mod", raw_call(ExprType::Modulus)),
177 ("sin", raw_call(ExprType::Sin)),
178 ("cos", raw_call(ExprType::Cos)),
179 ("tan", raw_call(ExprType::Tan)),
180 ("cot", raw_call(ExprType::Cot)),
181 ("asin", raw_call(ExprType::Asin)),
182 ("acos", raw_call(ExprType::Acos)),
183 ("atan", raw_call(ExprType::Atan)),
184 ("atan2", raw_call(ExprType::Atan2)),
185 ("sind", raw_call(ExprType::Sind)),
186 ("cosd", raw_call(ExprType::Cosd)),
187 ("cotd", raw_call(ExprType::Cotd)),
188 ("tand", raw_call(ExprType::Tand)),
189 ("sinh", raw_call(ExprType::Sinh)),
190 ("cosh", raw_call(ExprType::Cosh)),
191 ("tanh", raw_call(ExprType::Tanh)),
192 ("coth", raw_call(ExprType::Coth)),
193 ("asinh", raw_call(ExprType::Asinh)),
194 ("acosh", raw_call(ExprType::Acosh)),
195 ("atanh", raw_call(ExprType::Atanh)),
196 ("asind", raw_call(ExprType::Asind)),
197 ("acosd", raw_call(ExprType::Acosd)),
198 ("atand", raw_call(ExprType::Atand)),
199 ("atan2d", raw_call(ExprType::Atan2d)),
200 ("degrees", raw_call(ExprType::Degrees)),
201 ("radians", raw_call(ExprType::Radians)),
202 ("sqrt", raw_call(ExprType::Sqrt)),
203 ("cbrt", raw_call(ExprType::Cbrt)),
204 ("sign", raw_call(ExprType::Sign)),
205 ("scale", raw_call(ExprType::Scale)),
206 ("min_scale", raw_call(ExprType::MinScale)),
207 ("trim_scale", raw_call(ExprType::TrimScale)),
208 ("gamma", raw_call(ExprType::Gamma)),
209 ("lgamma", raw_call(ExprType::Lgamma)),
210 (
212 "to_timestamp",
213 dispatch_by_len(vec![
214 (1, raw_call(ExprType::SecToTimestamptz)),
215 (2, raw_call(ExprType::CharToTimestamptz)),
216 ]),
217 ),
218 ("date_trunc", raw_call(ExprType::DateTrunc)),
219 ("date_bin", raw_call(ExprType::DateBin)),
220 ("date_part", raw_call(ExprType::DatePart)),
221 ("make_date", raw_call(ExprType::MakeDate)),
222 ("make_time", raw_call(ExprType::MakeTime)),
223 ("make_timestamp", raw_call(ExprType::MakeTimestamp)),
224 ("make_timestamptz", raw_call(ExprType::MakeTimestamptz)),
225 ("timezone", guard_by_len(|_binder, [arg0, arg1]| {
226 Ok(FunctionCall::new(ExprType::AtTimeZone, vec![arg1, arg0])?.into())
228 })),
229 ("to_date", raw_call(ExprType::CharToDate)),
230 ("substr", raw_call(ExprType::Substr)),
232 ("length", raw_call(ExprType::Length)),
233 ("upper", raw_call(ExprType::Upper)),
234 ("lower", raw_call(ExprType::Lower)),
235 ("trim", raw_call(ExprType::Trim)),
236 ("replace", raw_call(ExprType::Replace)),
237 ("overlay", raw_call(ExprType::Overlay)),
238 ("btrim", raw_call(ExprType::Trim)),
239 ("ltrim", raw_call(ExprType::Ltrim)),
240 ("rtrim", raw_call(ExprType::Rtrim)),
241 ("md5", raw_call(ExprType::Md5)),
242 ("to_char", raw_call(ExprType::ToChar)),
243 (
244 "concat",
245 rewrite(ExprType::ConcatWs, rewrite_concat_to_concat_ws),
246 ),
247 ("concat_ws", raw_call(ExprType::ConcatWs)),
248 ("format", raw_call(ExprType::Format)),
249 ("translate", raw_call(ExprType::Translate)),
250 ("split_part", raw_call(ExprType::SplitPart)),
251 ("char_length", raw_call(ExprType::CharLength)),
252 ("character_length", raw_call(ExprType::CharLength)),
253 ("repeat", raw_call(ExprType::Repeat)),
254 ("ascii", raw_call(ExprType::Ascii)),
255 ("octet_length", raw_call(ExprType::OctetLength)),
256 ("bit_length", raw_call(ExprType::BitLength)),
257 ("regexp_match", raw_call(ExprType::RegexpMatch)),
258 ("regexp_replace", raw_call(ExprType::RegexpReplace)),
259 ("regexp_count", raw_call(ExprType::RegexpCount)),
260 ("regexp_split_to_array", raw_call(ExprType::RegexpSplitToArray)),
261 ("chr", raw_call(ExprType::Chr)),
262 ("starts_with", raw_call(ExprType::StartsWith)),
263 ("initcap", raw_call(ExprType::Initcap)),
264 ("lpad", raw_call(ExprType::Lpad)),
265 ("rpad", raw_call(ExprType::Rpad)),
266 ("reverse", raw_call(ExprType::Reverse)),
267 ("strpos", raw_call(ExprType::Position)),
268 ("to_ascii", raw_call(ExprType::ToAscii)),
269 ("to_hex", raw_call(ExprType::ToHex)),
270 ("quote_ident", raw_call(ExprType::QuoteIdent)),
271 ("quote_literal", guard_by_len(|_binder, [mut input]| {
272 if input.return_type() != DataType::Varchar {
273 FunctionCall::cast_mut(&mut input, &DataType::Varchar, CastContext::Explicit)?;
276 }
277 Ok(FunctionCall::new_unchecked(ExprType::QuoteLiteral, vec![input], DataType::Varchar).into())
278 })),
279 ("quote_nullable", guard_by_len(|_binder, [mut input]| {
280 if input.return_type() != DataType::Varchar {
281 FunctionCall::cast_mut(&mut input, &DataType::Varchar, CastContext::Explicit)?;
284 }
285 Ok(FunctionCall::new_unchecked(ExprType::QuoteNullable, vec![input], DataType::Varchar).into())
286 })),
287 ("string_to_array", raw_call(ExprType::StringToArray)),
288 ("get_bit", raw_call(ExprType::GetBit)),
289 ("get_byte", raw_call(ExprType::GetByte)),
290 ("set_bit", raw_call(ExprType::SetBit)),
291 ("set_byte", raw_call(ExprType::SetByte)),
292 ("bit_count", raw_call(ExprType::BitCount)),
293 ("encode", raw_call(ExprType::Encode)),
294 ("decode", raw_call(ExprType::Decode)),
295 ("convert_from", raw_call(ExprType::ConvertFrom)),
296 ("convert_to", raw_call(ExprType::ConvertTo)),
297 ("sha1", raw_call(ExprType::Sha1)),
298 ("sha224", raw_call(ExprType::Sha224)),
299 ("sha256", raw_call(ExprType::Sha256)),
300 ("sha384", raw_call(ExprType::Sha384)),
301 ("sha512", raw_call(ExprType::Sha512)),
302 ("encrypt", raw_call(ExprType::Encrypt)),
303 ("decrypt", raw_call(ExprType::Decrypt)),
304 ("hmac", raw_call(ExprType::Hmac)),
305 ("secure_compare", raw_call(ExprType::SecureCompare)),
306 ("left", raw_call(ExprType::Left)),
307 ("right", raw_call(ExprType::Right)),
308 ("inet_aton", raw_call(ExprType::InetAton)),
309 ("inet_ntoa", raw_call(ExprType::InetNtoa)),
310 ("int8send", raw_call(ExprType::PgwireSend)),
311 ("int8recv", guard_by_len(|_binder, [mut input]| {
312 let hint = if !input.is_untyped() && input.return_type() == DataType::Varchar {
314 " Consider `decode` or cast."
315 } else {
316 ""
317 };
318 input.cast_implicit_mut(&DataType::Bytea).map_err(|e| {
319 ErrorCode::BindError(format!("{} in `recv`.{hint}", e.as_report()))
320 })?;
321 Ok(FunctionCall::new_unchecked(ExprType::PgwireRecv, vec![input], DataType::Int64).into())
322 })),
323 ("array_cat", raw_call(ExprType::ArrayCat)),
325 ("array_append", raw_call(ExprType::ArrayAppend)),
326 ("array_join", raw_call(ExprType::ArrayToString)),
327 ("array_prepend", raw_call(ExprType::ArrayPrepend)),
328 ("array_to_string", raw_call(ExprType::ArrayToString)),
329 ("array_distinct", raw_call(ExprType::ArrayDistinct)),
330 ("array_min", raw_call(ExprType::ArrayMin)),
331 ("array_sort", raw_call(ExprType::ArraySort)),
332 ("array_length", raw_call(ExprType::ArrayLength)),
333 ("cardinality", raw_call(ExprType::Cardinality)),
334 ("array_remove", raw_call(ExprType::ArrayRemove)),
335 ("array_replace", raw_call(ExprType::ArrayReplace)),
336 ("array_reverse", raw_call(ExprType::ArrayReverse)),
337 ("array_max", raw_call(ExprType::ArrayMax)),
338 ("array_sum", raw_call(ExprType::ArraySum)),
339 ("array_position", raw_call(ExprType::ArrayPosition)),
340 ("array_positions", raw_call(ExprType::ArrayPositions)),
341 ("array_contains", raw_call(ExprType::ArrayContains)),
342 ("arraycontains", raw_call(ExprType::ArrayContains)),
343 ("array_contained", raw_call(ExprType::ArrayContained)),
344 ("arraycontained", raw_call(ExprType::ArrayContained)),
345 ("array_flatten", guard_by_len(|_binder, [input]| {
346 input.ensure_array_type().map_err(|_| ErrorCode::BindError("array_flatten expects `any[][]` input".into()))?;
347 let return_type = input.return_type().into_list_elem();
348 if !return_type.is_array() {
349 return Err(ErrorCode::BindError("array_flatten expects `any[][]` input".into()).into());
350 }
351 Ok(FunctionCall::new_unchecked(ExprType::ArrayFlatten, vec![input], return_type).into())
352 })),
353 ("trim_array", raw_call(ExprType::TrimArray)),
354 (
355 "array_ndims",
356 guard_by_len(|_binder, [input]| {
357 input.ensure_array_type()?;
358
359 let n = input.return_type().array_ndims()
360 .try_into().map_err(|_| ErrorCode::BindError("array_ndims integer overflow".into()))?;
361 Ok(ExprImpl::literal_int(n))
362 }),
363 ),
364 (
365 "array_lower",
366 guard_by_len(|binder, [arg0, arg1]| {
367 let ndims_expr = binder.bind_builtin_scalar_function("array_ndims", vec![arg0], false)?;
369 let arg1 = arg1.cast_implicit(&DataType::Int32)?;
370
371 FunctionCall::new(
372 ExprType::Case,
373 vec![
374 FunctionCall::new(
375 ExprType::And,
376 vec![
377 FunctionCall::new(ExprType::LessThan, vec![ExprImpl::literal_int(0), arg1.clone()])?.into(),
378 FunctionCall::new(ExprType::LessThanOrEqual, vec![arg1, ndims_expr])?.into(),
379 ],
380 )?.into(),
381 ExprImpl::literal_int(1),
382 ],
383 ).map(Into::into)
384 }),
385 ),
386 ("array_upper", raw_call(ExprType::ArrayLength)), ("array_dims", raw_call(ExprType::ArrayDims)),
388 ("hex_to_int256", raw_call(ExprType::HexToInt256)),
390 ("jsonb_object_field", raw_call(ExprType::JsonbAccess)),
392 ("jsonb_array_element", raw_call(ExprType::JsonbAccess)),
393 ("jsonb_object_field_text", raw_call(ExprType::JsonbAccessStr)),
394 ("jsonb_array_element_text", raw_call(ExprType::JsonbAccessStr)),
395 ("jsonb_extract_path", raw_call(ExprType::JsonbExtractPath)),
396 ("jsonb_extract_path_text", raw_call(ExprType::JsonbExtractPathText)),
397 ("jsonb_typeof", raw_call(ExprType::JsonbTypeof)),
398 ("jsonb_array_length", raw_call(ExprType::JsonbArrayLength)),
399 ("jsonb_concat", raw_call(ExprType::JsonbConcat)),
400 ("jsonb_object", raw_call(ExprType::JsonbObject)),
401 ("jsonb_pretty", raw_call(ExprType::JsonbPretty)),
402 ("jsonb_contains", raw_call(ExprType::JsonbContains)),
403 ("jsonb_contained", raw_call(ExprType::JsonbContained)),
404 ("jsonb_exists", raw_call(ExprType::JsonbExists)),
405 ("jsonb_exists_any", raw_call(ExprType::JsonbExistsAny)),
406 ("jsonb_exists_all", raw_call(ExprType::JsonbExistsAll)),
407 ("jsonb_delete", raw_call(ExprType::Subtract)),
408 ("jsonb_delete_path", raw_call(ExprType::JsonbDeletePath)),
409 ("jsonb_strip_nulls", raw_call(ExprType::JsonbStripNulls)),
410 ("to_jsonb", raw_call(ExprType::ToJsonb)),
411 ("jsonb_build_array", raw_call(ExprType::JsonbBuildArray)),
412 ("jsonb_build_object", raw_call(ExprType::JsonbBuildObject)),
413 ("jsonb_populate_record", raw_call(ExprType::JsonbPopulateRecord)),
414 ("jsonb_path_match", raw_call(ExprType::JsonbPathMatch)),
415 ("jsonb_path_exists", raw_call(ExprType::JsonbPathExists)),
416 ("jsonb_path_query_array", raw_call(ExprType::JsonbPathQueryArray)),
417 ("jsonb_path_query_first", raw_call(ExprType::JsonbPathQueryFirst)),
418 ("jsonb_set", raw_call(ExprType::JsonbSet)),
419 ("jsonb_populate_map", raw_call(ExprType::JsonbPopulateMap)),
420 ("jsonb_to_array", raw_call(ExprType::JsonbToArray)),
421 ("map_from_entries", raw_call(ExprType::MapFromEntries)),
423 ("map_access", raw_call(ExprType::MapAccess)),
424 ("map_keys", raw_call(ExprType::MapKeys)),
425 ("map_values", raw_call(ExprType::MapValues)),
426 ("map_entries", raw_call(ExprType::MapEntries)),
427 ("map_from_key_values", raw_call(ExprType::MapFromKeyValues)),
428 ("map_cat", raw_call(ExprType::MapCat)),
429 ("map_contains", raw_call(ExprType::MapContains)),
430 ("map_delete", raw_call(ExprType::MapDelete)),
431 ("map_insert", raw_call(ExprType::MapInsert)),
432 ("map_length", raw_call(ExprType::MapLength)),
433 ("l2_distance", raw_call(ExprType::L2Distance)),
435 ("cosine_distance", raw_call(ExprType::CosineDistance)),
436 ("l1_distance", raw_call(ExprType::L1Distance)),
437 ("inner_product", raw_call(ExprType::InnerProduct)),
438 ("vector_norm", raw_call(ExprType::L2Norm)),
439 ("l2_normalize", raw_call(ExprType::L2Normalize)),
440 ("subvector", guard_by_len(|_, [vector_expr, start_expr, len_expr]| {
441 let dimensions = if let DataType::Vector(length) = vector_expr.return_type() {
442 length as i32
443 } else {
444 return Err(ErrorCode::BindError("subvector expects `vector(dim)` input".into()).into());
445 };
446 let start = start_expr
447 .try_fold_const()
448 .transpose()?
449 .and_then(|datum| match datum {
450 Some(ScalarImpl::Int32(v)) => Some(v),
451 _ => None,
452 })
453 .ok_or_else(|| ErrorCode::ExprError("`start` must be an Int32 constant".into()))?;
454
455 let len = len_expr
456 .try_fold_const()
457 .transpose()?
458 .and_then(|datum| match datum {
459 Some(ScalarImpl::Int32(v)) => Some(v),
460 _ => None,
461 })
462 .ok_or_else(|| ErrorCode::ExprError("`count` must be an Int32 constant".into()))?;
463 if len < 1 || len > DataType::VEC_MAX_SIZE as i32 {
464 return Err(ErrorCode::InvalidParameterValue(format!("Invalid vector size: expected 1..={}, got {}", DataType::VEC_MAX_SIZE, len)).into());
465 }
466
467 let end = start + len - 1;
468
469 if start < 1 || end > dimensions {
470 return Err(ErrorCode::InvalidParameterValue(format!(
471 "vector slice range out of bounds: start={}, end={}, valid range is [1, {}]",
472 start,
473 end,
474 dimensions
475 )).into());
476 }
477
478 Ok(FunctionCall::new_unchecked(ExprType::Subvector, vec![vector_expr, start_expr, len_expr], DataType::Vector(len as usize)).into())
479 })),
480 ("pi", pi()),
482 ("greatest", raw_call(ExprType::Greatest)),
484 ("least", raw_call(ExprType::Least)),
485 (
487 "pg_typeof",
488 guard_by_len(|_binder, [input]| {
489 let v = match input.is_untyped() {
490 true => "unknown".into(),
491 false => input.return_type().to_string(),
492 };
493 Ok(ExprImpl::literal_varchar(v))
494 }),
495 ),
496 ("current_catalog", current_database()),
497 ("current_database", current_database()),
498 ("current_schema", guard_by_len(|binder, []| {
499 Ok(binder
500 .first_valid_schema()
501 .map(|schema| ExprImpl::literal_varchar(schema.name()))
502 .unwrap_or_else(|_| ExprImpl::literal_null(DataType::Varchar)))
503 })),
504 ("current_schemas", raw(|binder, mut inputs| {
505 let no_match_err = ErrorCode::ExprError(
506 "No function matches the given name and argument types. You might need to add explicit type casts.".into()
507 );
508 if inputs.len() != 1 {
509 return Err(no_match_err.into());
510 }
511 let input = inputs
512 .pop()
513 .unwrap()
514 .enforce_bool_clause("current_schemas")
515 .map_err(|_| no_match_err)?;
516
517 let ExprImpl::Literal(literal) = &input else {
518 bail_not_implemented!("Only boolean literals are supported in `current_schemas`.");
519 };
520
521 let Some(bool) = literal.get_data().as_ref().map(|bool| bool.clone().into_bool()) else {
522 return Ok(ExprImpl::literal_null(DataType::Varchar.list()));
523 };
524
525 let paths = if bool {
526 binder.search_path.path()
527 } else {
528 binder.search_path.real_path()
529 };
530
531 let mut schema_names = vec![];
532 for path in paths {
533 let mut schema_name = path;
534 if schema_name == USER_NAME_WILD_CARD {
535 schema_name = &binder.auth_context.user_name;
536 }
537
538 if binder
539 .catalog
540 .get_schema_by_name(&binder.db_name, schema_name)
541 .is_ok()
542 {
543 schema_names.push(schema_name.as_str());
544 }
545 }
546
547 Ok(ExprImpl::literal_list(
548 ListValue::from_iter(schema_names),
549 DataType::Varchar,
550 ))
551 })),
552 ("session_user", session_user()),
553 ("current_role", current_user()),
554 ("current_user", current_user()),
555 ("user", current_user()),
556 ("pg_get_userbyid", raw_call(ExprType::PgGetUserbyid)),
557 ("pg_get_indexdef", raw_call(ExprType::PgGetIndexdef)),
558 ("pg_get_viewdef", raw_call(ExprType::PgGetViewdef)),
559 ("pg_index_column_has_property", raw_call(ExprType::PgIndexColumnHasProperty)),
560 ("pg_relation_size", raw(|_binder, mut inputs| {
561 if inputs.is_empty() {
562 return Err(ErrorCode::ExprError(
563 "function pg_relation_size() does not exist".into(),
564 )
565 .into());
566 }
567 inputs[0].cast_to_regclass_mut()?;
568 Ok(FunctionCall::new(ExprType::PgRelationSize, inputs)?.into())
569 })),
570 ("pg_get_serial_sequence", raw_literal(ExprImpl::literal_null(DataType::Varchar))),
571 ("pg_table_size", guard_by_len(|_binder, [mut input]| {
572 input.cast_to_regclass_mut()?;
573 Ok(FunctionCall::new(ExprType::PgRelationSize, vec![input])?.into())
574 })),
575 ("pg_indexes_size", guard_by_len(|_binder, [mut input]| {
576 input.cast_to_regclass_mut()?;
577 Ok(FunctionCall::new(ExprType::PgIndexesSize, vec![input])?.into())
578 })),
579 ("pg_get_expr", raw(|_binder, inputs| {
580 if inputs.len() == 2 || inputs.len() == 3 {
581 Ok(ExprImpl::literal_varchar("".into()))
583 } else {
584 Err(ErrorCode::ExprError(
585 "Too many/few arguments for pg_catalog.pg_get_expr()".into(),
586 )
587 .into())
588 }
589 })),
590 ("pg_my_temp_schema", guard_by_len(|_binder, []| {
591 Ok(ExprImpl::literal_int(
593 0,
595 ))
596 })),
597 ("current_setting", guard_by_len(|binder, [input]| {
598 let input = if let ExprImpl::Literal(literal) = &input &&
599 let Some(ScalarImpl::Utf8(input)) = literal.get_data()
600 {
601 input
602 } else {
603 return Err(ErrorCode::ExprError(
604 "Only literal is supported in `setting_name`.".into(),
605 )
606 .into());
607 };
608 let session_config = binder.session_config.read();
609 Ok(ExprImpl::literal_varchar(session_config.get(input.as_ref())?))
610 })),
611 ("set_config", guard_by_len(|binder, [arg0, arg1, arg2]| {
612 let setting_name = if let ExprImpl::Literal(literal) = &arg0 && let Some(ScalarImpl::Utf8(input)) = literal.get_data() {
613 input
614 } else {
615 return Err(ErrorCode::ExprError(
616 "Only string literal is supported in `setting_name`.".into(),
617 )
618 .into());
619 };
620
621 let new_value = if let ExprImpl::Literal(literal) = &arg1 && let Some(ScalarImpl::Utf8(input)) = literal.get_data() {
622 input
623 } else {
624 return Err(ErrorCode::ExprError(
625 "Only string literal is supported in `setting_name`.".into(),
626 )
627 .into());
628 };
629
630 let is_local = if let ExprImpl::Literal(literal) = &arg2 && let Some(ScalarImpl::Bool(input)) = literal.get_data() {
631 input
632 } else {
633 return Err(ErrorCode::ExprError(
634 "Only bool literal is supported in `is_local`.".into(),
635 )
636 .into());
637 };
638
639 if *is_local {
640 return Err(ErrorCode::ExprError(
641 "`is_local = true` is not supported now.".into(),
642 )
643 .into());
644 }
645
646 let mut session_config = binder.session_config.write();
647
648 session_config.set(setting_name, new_value.to_string(), &mut ())?;
650
651 Ok(ExprImpl::literal_varchar(new_value.to_string()))
652 })),
653 ("format_type", raw_call(ExprType::FormatType)),
654 ("pg_table_is_visible", raw_call(ExprType::PgTableIsVisible)),
655 ("pg_type_is_visible", raw_literal(ExprImpl::literal_bool(true))),
656 ("pg_get_constraintdef", raw_literal(ExprImpl::literal_null(DataType::Varchar))),
657 ("pg_get_partkeydef", raw_literal(ExprImpl::literal_null(DataType::Varchar))),
658 ("pg_encoding_to_char", raw_literal(ExprImpl::literal_varchar("UTF8".into()))),
659 ("has_database_privilege", raw(|binder, mut inputs| {
660 if inputs.len() == 2 {
661 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
662 }
663 if inputs.len() == 3 {
664 Ok(FunctionCall::new(ExprType::HasDatabasePrivilege, inputs)?.into())
665 } else {
666 Err(ErrorCode::ExprError(
667 "Too many/few arguments for pg_catalog.has_database_privilege()".into(),
668 )
669 .into())
670 }
671 })),
672 ("has_table_privilege", raw(|binder, mut inputs| {
673 if inputs.len() == 2 {
674 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
675 }
676 if inputs.len() == 3 {
677 if inputs[1].return_type() == DataType::Varchar {
678 inputs[1].cast_to_regclass_mut()?;
679 }
680 Ok(FunctionCall::new(ExprType::HasTablePrivilege, inputs)?.into())
681 } else {
682 Err(ErrorCode::ExprError(
683 "Too many/few arguments for pg_catalog.has_table_privilege()".into(),
684 )
685 .into())
686 }
687 })),
688 ("has_any_column_privilege", raw(|binder, mut inputs| {
689 if inputs.len() == 2 {
690 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
691 }
692 if inputs.len() == 3 {
693 if inputs[1].return_type() == DataType::Varchar {
694 inputs[1].cast_to_regclass_mut()?;
695 }
696 Ok(FunctionCall::new(ExprType::HasAnyColumnPrivilege, inputs)?.into())
697 } else {
698 Err(ErrorCode::ExprError(
699 "Too many/few arguments for pg_catalog.has_any_column_privilege()".into(),
700 )
701 .into())
702 }
703 })),
704 ("has_schema_privilege", raw(|binder, mut inputs| {
705 if inputs.len() == 2 {
706 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
707 }
708 if inputs.len() == 3 {
709 Ok(FunctionCall::new(ExprType::HasSchemaPrivilege, inputs)?.into())
710 } else {
711 Err(ErrorCode::ExprError(
712 "Too many/few arguments for pg_catalog.has_schema_privilege()".into(),
713 )
714 .into())
715 }
716 })),
717 ("has_function_privilege", raw(|binder, mut inputs| {
718 if inputs.len() == 2 {
719 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
720 }
721 if inputs.len() == 3 {
722 Ok(FunctionCall::new(ExprType::HasFunctionPrivilege, inputs)?.into())
723 } else {
724 Err(ErrorCode::ExprError(
725 "Too many/few arguments for pg_catalog.has_function_privilege()".into(),
726 )
727 .into())
728 }
729 })),
730 ("pg_stat_get_numscans", raw_literal(ExprImpl::literal_bigint(0))),
731 ("pg_backend_pid", raw(|binder, _inputs| {
732 Ok(ExprImpl::literal_int(binder.session_id.0))
734 })),
735 ("pg_cancel_backend", guard_by_len(|_binder, [_input]| {
736 Ok(ExprImpl::literal_bool(false))
738 })),
739 ("pg_terminate_backend", guard_by_len(|_binder, [_input]| {
740 Ok(ExprImpl::literal_bool(false))
743 })),
744 ("pg_tablespace_location", guard_by_len(|_binder, [_input]| {
745 Ok(ExprImpl::literal_null(DataType::Varchar))
746 })),
747 ("pg_postmaster_start_time", guard_by_len(|_binder, []| {
748 let server_start_time = risingwave_variables::get_server_start_time();
749 let datum = server_start_time.map(Timestamptz::from).map(ScalarImpl::from);
750 let literal = Literal::new(datum, DataType::Timestamptz);
751 Ok(literal.into())
752 })),
753 ("col_description", raw_call(ExprType::ColDescription)),
757 ("obj_description", raw_literal(ExprImpl::literal_varchar("".to_owned()))),
758 ("shobj_description", raw_literal(ExprImpl::literal_varchar("".to_owned()))),
759 ("pg_is_in_recovery", raw_call(ExprType::PgIsInRecovery)),
760 ("rw_recovery_status", raw_call(ExprType::RwRecoveryStatus)),
761 ("rw_cluster_id", raw_call(ExprType::RwClusterId)),
762 ("rw_epoch_to_ts", raw_call(ExprType::RwEpochToTs)),
763 ("rw_fragment_vnodes", raw_call(ExprType::RwFragmentVnodes)),
764 ("rw_actor_vnodes", raw_call(ExprType::RwActorVnodes)),
765 ("rw_vnode", raw_call(ExprType::VnodeUser)),
767 ("rw_license", raw_call(ExprType::License)),
768 ("rw_test_paid_tier", raw_call(ExprType::TestFeature)), ("rw_test_feature", raw_call(ExprType::TestFeature)), ("version", raw_literal(ExprImpl::literal_varchar(current_cluster_version()))),
772 ("now", now()),
774 ("current_timestamp", now()),
775 ("proctime", proctime()),
776 ("pg_sleep", raw_call(ExprType::PgSleep)),
777 ("pg_sleep_for", raw_call(ExprType::PgSleepFor)),
778 ("random", raw_call(ExprType::Random)),
779 ("date", guard_by_len(|_binder, [input]| {
785 input.cast_explicit(&DataType::Date).map_err(Into::into)
786 })),
787
788 ("openai_embedding", guard_by_len(|_binder, [arg0, arg1]| {
790 if let ExprImpl::Literal(config) = &arg0 && let Some(ScalarImpl::Jsonb(_config)) = config.get_data() {
792 Ok(FunctionCall::new(ExprType::OpenaiEmbedding, vec![arg0, arg1])?.into())
793 } else {
794 Err(ErrorCode::InvalidInputSyntax(
795 "`embedding_config` must be constant jsonb".to_owned(),
796 ).into())
797 }
798 })),
799 ]
800 .into_iter()
801 .collect()
802 });
803
804 static FUNCTIONS_BKTREE: LazyLock<BKTree<&str>> = LazyLock::new(|| {
805 let mut tree = BKTree::new(metrics::Levenshtein);
806
807 for k in HANDLES.keys() {
809 tree.add(*k);
810 }
811
812 tree
813 });
814
815 if variadic {
816 let func = match function_name {
817 "format" => ExprType::FormatVariadic,
818 "concat" => ExprType::ConcatVariadic,
819 "concat_ws" => ExprType::ConcatWsVariadic,
820 "jsonb_build_array" => ExprType::JsonbBuildArrayVariadic,
821 "jsonb_build_object" => ExprType::JsonbBuildObjectVariadic,
822 "jsonb_extract_path" => ExprType::JsonbExtractPathVariadic,
823 "jsonb_extract_path_text" => ExprType::JsonbExtractPathTextVariadic,
824 _ => {
825 return Err(ErrorCode::BindError(format!(
826 "VARIADIC argument is not allowed in function \"{}\"",
827 function_name
828 ))
829 .into());
830 }
831 };
832 return Ok(FunctionCall::new(func, inputs)?.into());
833 }
834
835 match HANDLES.get(function_name) {
837 Some(handle) => handle(self, inputs),
838 None => {
839 let allowed_distance = if function_name.len() > 3 { 2 } else { 1 };
840
841 let candidates = FUNCTIONS_BKTREE
842 .find(function_name, allowed_distance)
843 .map(|(_idx, c)| c)
844 .join(" or ");
845
846 Err(no_function!(
847 candidates = (!candidates.is_empty()).then_some(candidates),
848 "{}({})",
849 function_name,
850 inputs.iter().map(|e| e.return_type()).join(", ")
851 )
852 .into())
853 }
854 }
855 }
856
857 fn ensure_now_function_allowed(&self) -> Result<()> {
858 if self.is_for_stream()
859 && !matches!(
860 self.context.clause,
861 Some(Clause::Where)
862 | Some(Clause::Having)
863 | Some(Clause::JoinOn)
864 | Some(Clause::From)
865 )
866 {
867 return Err(ErrorCode::InvalidInputSyntax(format!(
868 "For streaming queries, `NOW()` function is only allowed in `WHERE`, `HAVING`, `ON` and `FROM`. Found in clause: {:?}. \
869 Please please refer to https://www.risingwave.dev/docs/current/sql-pattern-temporal-filters/ for more information",
870 self.context.clause
871 ))
872 .into());
873 }
874 if matches!(self.context.clause, Some(Clause::GeneratedColumn)) {
875 return Err(ErrorCode::InvalidInputSyntax(
876 "Cannot use `NOW()` function in generated columns. Do you want `PROCTIME()`?"
877 .to_owned(),
878 )
879 .into());
880 }
881 Ok(())
882 }
883
884 fn ensure_proctime_function_allowed(&self) -> Result<()> {
885 if !self.is_for_ddl() {
886 return Err(ErrorCode::InvalidInputSyntax(
887 "Function `PROCTIME()` is only allowed in CREATE TABLE/SOURCE. Is `NOW()` what you want?".to_owned(),
888 )
889 .into());
890 }
891 Ok(())
892 }
893}
894
895fn rewrite_concat_to_concat_ws(inputs: Vec<ExprImpl>) -> Result<Vec<ExprImpl>> {
896 if inputs.is_empty() {
897 Err(ErrorCode::BindError(
898 "Function `concat` takes at least 1 arguments (0 given)".to_owned(),
899 )
900 .into())
901 } else {
902 let inputs = std::iter::once(ExprImpl::literal_varchar("".to_owned()))
903 .chain(inputs)
904 .collect();
905 Ok(inputs)
906 }
907}
908
909fn rewrite_nullif_to_case_when(inputs: Vec<ExprImpl>) -> Result<Vec<ExprImpl>> {
912 if inputs.len() != 2 {
913 Err(ErrorCode::BindError("Function `nullif` must contain 2 arguments".to_owned()).into())
914 } else {
915 let inputs = vec![
916 FunctionCall::new(ExprType::Equal, inputs.clone())?.into(),
917 Literal::new(None, inputs[0].return_type()).into(),
918 inputs[0].clone(),
919 ];
920 Ok(inputs)
921 }
922}
923
924fn rewrite_two_bool_inputs(mut inputs: Vec<ExprImpl>) -> Result<Vec<ExprImpl>> {
925 if inputs.len() != 2 {
926 return Err(
927 ErrorCode::BindError("function must contain only 2 arguments".to_owned()).into(),
928 );
929 }
930 let left = inputs.pop().unwrap();
931 let right = inputs.pop().unwrap();
932 Ok(vec![
933 left.cast_implicit(&DataType::Boolean)?,
934 right.cast_implicit(&DataType::Boolean)?,
935 ])
936}