1use std::collections::HashMap;
16use std::sync::LazyLock;
17
18use bk_tree::{BKTree, metrics};
19use itertools::Itertools;
20use risingwave_common::session_config::USER_NAME_WILD_CARD;
21use risingwave_common::types::{DataType, ListValue, ScalarImpl, Timestamptz};
22use risingwave_common::{bail_not_implemented, current_cluster_version, no_function};
23use thiserror_ext::AsReport;
24
25use crate::Binder;
26use crate::binder::Clause;
27use crate::error::{ErrorCode, Result};
28use crate::expr::{CastContext, Expr, ExprImpl, ExprType, FunctionCall, Literal, Now};
29
30impl Binder {
31 pub(super) fn bind_builtin_scalar_function(
32 &mut self,
33 function_name: &str,
34 inputs: Vec<ExprImpl>,
35 variadic: bool,
36 ) -> Result<ExprImpl> {
37 type Inputs = Vec<ExprImpl>;
38
39 type Handle = Box<dyn Fn(&mut Binder, Inputs) -> Result<ExprImpl> + Sync + Send>;
40
41 fn rewrite(r#type: ExprType, rewriter: fn(Inputs) -> Result<Inputs>) -> Handle {
42 Box::new(move |_binder, mut inputs| {
43 inputs = (rewriter)(inputs)?;
44 Ok(FunctionCall::new(r#type, inputs)?.into())
45 })
46 }
47
48 fn raw_call(r#type: ExprType) -> Handle {
49 rewrite(r#type, Ok)
50 }
51
52 fn guard_by_len<const E: usize>(
53 handle: impl Fn(&mut Binder, [ExprImpl; E]) -> Result<ExprImpl> + Sync + Send + 'static,
54 ) -> Handle {
55 Box::new(move |binder, inputs| {
56 let input_len = inputs.len();
57 let Ok(inputs) = inputs.try_into() else {
58 return Err(ErrorCode::ExprError(
59 format!("unexpected arguments number {}, expect {}", input_len, E).into(),
60 )
61 .into());
62 };
63 handle(binder, inputs)
64 })
65 }
66
67 fn raw<F: Fn(&mut Binder, Inputs) -> Result<ExprImpl> + Sync + Send + 'static>(
68 f: F,
69 ) -> Handle {
70 Box::new(f)
71 }
72
73 fn dispatch_by_len(mapping: Vec<(usize, Handle)>) -> Handle {
74 Box::new(move |binder, inputs| {
75 for (len, handle) in &mapping {
76 if inputs.len() == *len {
77 return handle(binder, inputs);
78 }
79 }
80 Err(ErrorCode::ExprError("unexpected arguments number".into()).into())
81 })
82 }
83
84 fn raw_literal(literal: ExprImpl) -> Handle {
85 Box::new(move |_binder, _inputs| Ok(literal.clone()))
86 }
87
88 fn now() -> Handle {
89 guard_by_len(move |binder, []| {
90 binder.ensure_now_function_allowed()?;
91 Ok(Now.into())
94 })
95 }
96
97 fn pi() -> Handle {
98 raw_literal(ExprImpl::literal_f64(std::f64::consts::PI))
99 }
100
101 fn proctime() -> Handle {
102 Box::new(move |binder, inputs| {
103 binder.ensure_proctime_function_allowed()?;
104 raw_call(ExprType::Proctime)(binder, inputs)
105 })
106 }
107
108 fn session_user() -> Handle {
110 guard_by_len(|binder, []| {
111 Ok(ExprImpl::literal_varchar(
112 binder.auth_context.user_name.clone(),
113 ))
114 })
115 }
116
117 fn current_user() -> Handle {
121 guard_by_len(|binder, []| {
122 Ok(ExprImpl::literal_varchar(
123 binder.auth_context.user_name.clone(),
124 ))
125 })
126 }
127
128 fn current_database() -> Handle {
131 guard_by_len(|binder, []| Ok(ExprImpl::literal_varchar(binder.db_name.clone())))
132 }
133
134 static HANDLES: LazyLock<HashMap<&'static str, Handle>> = LazyLock::new(|| {
138 [
139 (
140 "booleq",
141 rewrite(ExprType::Equal, rewrite_two_bool_inputs),
142 ),
143 (
144 "boolne",
145 rewrite(ExprType::NotEqual, rewrite_two_bool_inputs),
146 ),
147 ("coalesce", rewrite(ExprType::Coalesce, |inputs| {
148 if inputs.iter().any(ExprImpl::has_table_function) {
149 return Err(ErrorCode::BindError("table functions are not allowed in COALESCE".into()).into());
150 }
151 Ok(inputs)
152 })),
153 (
154 "nullif",
155 rewrite(ExprType::Case, rewrite_nullif_to_case_when),
156 ),
157 (
158 "round",
159 dispatch_by_len(vec![
160 (2, raw_call(ExprType::RoundDigit)),
161 (1, raw_call(ExprType::Round)),
162 ]),
163 ),
164 ("pow", raw_call(ExprType::Pow)),
165 ("power", raw_call(ExprType::Pow)),
167 ("ceil", raw_call(ExprType::Ceil)),
168 ("ceiling", raw_call(ExprType::Ceil)),
169 ("floor", raw_call(ExprType::Floor)),
170 ("trunc", raw_call(ExprType::Trunc)),
171 ("abs", raw_call(ExprType::Abs)),
172 ("exp", raw_call(ExprType::Exp)),
173 ("ln", raw_call(ExprType::Ln)),
174 ("log", raw_call(ExprType::Log10)),
175 ("log10", raw_call(ExprType::Log10)),
176 ("mod", raw_call(ExprType::Modulus)),
177 ("sin", raw_call(ExprType::Sin)),
178 ("cos", raw_call(ExprType::Cos)),
179 ("tan", raw_call(ExprType::Tan)),
180 ("cot", raw_call(ExprType::Cot)),
181 ("asin", raw_call(ExprType::Asin)),
182 ("acos", raw_call(ExprType::Acos)),
183 ("atan", raw_call(ExprType::Atan)),
184 ("atan2", raw_call(ExprType::Atan2)),
185 ("sind", raw_call(ExprType::Sind)),
186 ("cosd", raw_call(ExprType::Cosd)),
187 ("cotd", raw_call(ExprType::Cotd)),
188 ("tand", raw_call(ExprType::Tand)),
189 ("sinh", raw_call(ExprType::Sinh)),
190 ("cosh", raw_call(ExprType::Cosh)),
191 ("tanh", raw_call(ExprType::Tanh)),
192 ("coth", raw_call(ExprType::Coth)),
193 ("asinh", raw_call(ExprType::Asinh)),
194 ("acosh", raw_call(ExprType::Acosh)),
195 ("atanh", raw_call(ExprType::Atanh)),
196 ("asind", raw_call(ExprType::Asind)),
197 ("acosd", raw_call(ExprType::Acosd)),
198 ("atand", raw_call(ExprType::Atand)),
199 ("atan2d", raw_call(ExprType::Atan2d)),
200 ("degrees", raw_call(ExprType::Degrees)),
201 ("radians", raw_call(ExprType::Radians)),
202 ("sqrt", raw_call(ExprType::Sqrt)),
203 ("cbrt", raw_call(ExprType::Cbrt)),
204 ("sign", raw_call(ExprType::Sign)),
205 ("scale", raw_call(ExprType::Scale)),
206 ("min_scale", raw_call(ExprType::MinScale)),
207 ("trim_scale", raw_call(ExprType::TrimScale)),
208 (
210 "to_timestamp",
211 dispatch_by_len(vec![
212 (1, raw_call(ExprType::SecToTimestamptz)),
213 (2, raw_call(ExprType::CharToTimestamptz)),
214 ]),
215 ),
216 ("date_trunc", raw_call(ExprType::DateTrunc)),
217 ("date_bin", raw_call(ExprType::DateBin)),
218 ("date_part", raw_call(ExprType::DatePart)),
219 ("make_date", raw_call(ExprType::MakeDate)),
220 ("make_time", raw_call(ExprType::MakeTime)),
221 ("make_timestamp", raw_call(ExprType::MakeTimestamp)),
222 ("make_timestamptz", raw_call(ExprType::MakeTimestamptz)),
223 ("timezone", guard_by_len(|_binder, [arg0, arg1]| {
224 Ok(FunctionCall::new(ExprType::AtTimeZone, vec![arg1, arg0])?.into())
226 })),
227 ("to_date", raw_call(ExprType::CharToDate)),
228 ("substr", raw_call(ExprType::Substr)),
230 ("length", raw_call(ExprType::Length)),
231 ("upper", raw_call(ExprType::Upper)),
232 ("lower", raw_call(ExprType::Lower)),
233 ("trim", raw_call(ExprType::Trim)),
234 ("replace", raw_call(ExprType::Replace)),
235 ("overlay", raw_call(ExprType::Overlay)),
236 ("btrim", raw_call(ExprType::Trim)),
237 ("ltrim", raw_call(ExprType::Ltrim)),
238 ("rtrim", raw_call(ExprType::Rtrim)),
239 ("md5", raw_call(ExprType::Md5)),
240 ("to_char", raw_call(ExprType::ToChar)),
241 (
242 "concat",
243 rewrite(ExprType::ConcatWs, rewrite_concat_to_concat_ws),
244 ),
245 ("concat_ws", raw_call(ExprType::ConcatWs)),
246 ("format", raw_call(ExprType::Format)),
247 ("translate", raw_call(ExprType::Translate)),
248 ("split_part", raw_call(ExprType::SplitPart)),
249 ("char_length", raw_call(ExprType::CharLength)),
250 ("character_length", raw_call(ExprType::CharLength)),
251 ("repeat", raw_call(ExprType::Repeat)),
252 ("ascii", raw_call(ExprType::Ascii)),
253 ("octet_length", raw_call(ExprType::OctetLength)),
254 ("bit_length", raw_call(ExprType::BitLength)),
255 ("regexp_match", raw_call(ExprType::RegexpMatch)),
256 ("regexp_replace", raw_call(ExprType::RegexpReplace)),
257 ("regexp_count", raw_call(ExprType::RegexpCount)),
258 ("regexp_split_to_array", raw_call(ExprType::RegexpSplitToArray)),
259 ("chr", raw_call(ExprType::Chr)),
260 ("starts_with", raw_call(ExprType::StartsWith)),
261 ("initcap", raw_call(ExprType::Initcap)),
262 ("lpad", raw_call(ExprType::Lpad)),
263 ("rpad", raw_call(ExprType::Rpad)),
264 ("reverse", raw_call(ExprType::Reverse)),
265 ("strpos", raw_call(ExprType::Position)),
266 ("to_ascii", raw_call(ExprType::ToAscii)),
267 ("to_hex", raw_call(ExprType::ToHex)),
268 ("quote_ident", raw_call(ExprType::QuoteIdent)),
269 ("quote_literal", guard_by_len(|_binder, [mut input]| {
270 if input.return_type() != DataType::Varchar {
271 FunctionCall::cast_mut(&mut input, &DataType::Varchar, CastContext::Explicit)?;
274 }
275 Ok(FunctionCall::new_unchecked(ExprType::QuoteLiteral, vec![input], DataType::Varchar).into())
276 })),
277 ("quote_nullable", guard_by_len(|_binder, [mut input]| {
278 if input.return_type() != DataType::Varchar {
279 FunctionCall::cast_mut(&mut input, &DataType::Varchar, CastContext::Explicit)?;
282 }
283 Ok(FunctionCall::new_unchecked(ExprType::QuoteNullable, vec![input], DataType::Varchar).into())
284 })),
285 ("string_to_array", raw_call(ExprType::StringToArray)),
286 ("get_bit", raw_call(ExprType::GetBit)),
287 ("get_byte", raw_call(ExprType::GetByte)),
288 ("set_bit", raw_call(ExprType::SetBit)),
289 ("set_byte", raw_call(ExprType::SetByte)),
290 ("bit_count", raw_call(ExprType::BitCount)),
291 ("encode", raw_call(ExprType::Encode)),
292 ("decode", raw_call(ExprType::Decode)),
293 ("convert_from", raw_call(ExprType::ConvertFrom)),
294 ("convert_to", raw_call(ExprType::ConvertTo)),
295 ("sha1", raw_call(ExprType::Sha1)),
296 ("sha224", raw_call(ExprType::Sha224)),
297 ("sha256", raw_call(ExprType::Sha256)),
298 ("sha384", raw_call(ExprType::Sha384)),
299 ("sha512", raw_call(ExprType::Sha512)),
300 ("encrypt", raw_call(ExprType::Encrypt)),
301 ("decrypt", raw_call(ExprType::Decrypt)),
302 ("hmac", raw_call(ExprType::Hmac)),
303 ("secure_compare", raw_call(ExprType::SecureCompare)),
304 ("left", raw_call(ExprType::Left)),
305 ("right", raw_call(ExprType::Right)),
306 ("inet_aton", raw_call(ExprType::InetAton)),
307 ("inet_ntoa", raw_call(ExprType::InetNtoa)),
308 ("int8send", raw_call(ExprType::PgwireSend)),
309 ("int8recv", guard_by_len(|_binder, [mut input]| {
310 let hint = if !input.is_untyped() && input.return_type() == DataType::Varchar {
312 " Consider `decode` or cast."
313 } else {
314 ""
315 };
316 input.cast_implicit_mut(&DataType::Bytea).map_err(|e| {
317 ErrorCode::BindError(format!("{} in `recv`.{hint}", e.as_report()))
318 })?;
319 Ok(FunctionCall::new_unchecked(ExprType::PgwireRecv, vec![input], DataType::Int64).into())
320 })),
321 ("array_cat", raw_call(ExprType::ArrayCat)),
323 ("array_append", raw_call(ExprType::ArrayAppend)),
324 ("array_join", raw_call(ExprType::ArrayToString)),
325 ("array_prepend", raw_call(ExprType::ArrayPrepend)),
326 ("array_to_string", raw_call(ExprType::ArrayToString)),
327 ("array_distinct", raw_call(ExprType::ArrayDistinct)),
328 ("array_min", raw_call(ExprType::ArrayMin)),
329 ("array_sort", raw_call(ExprType::ArraySort)),
330 ("array_length", raw_call(ExprType::ArrayLength)),
331 ("cardinality", raw_call(ExprType::Cardinality)),
332 ("array_remove", raw_call(ExprType::ArrayRemove)),
333 ("array_replace", raw_call(ExprType::ArrayReplace)),
334 ("array_max", raw_call(ExprType::ArrayMax)),
335 ("array_sum", raw_call(ExprType::ArraySum)),
336 ("array_position", raw_call(ExprType::ArrayPosition)),
337 ("array_positions", raw_call(ExprType::ArrayPositions)),
338 ("array_contains", raw_call(ExprType::ArrayContains)),
339 ("arraycontains", raw_call(ExprType::ArrayContains)),
340 ("array_contained", raw_call(ExprType::ArrayContained)),
341 ("arraycontained", raw_call(ExprType::ArrayContained)),
342 ("array_flatten", guard_by_len(|_binder, [input]| {
343 input.ensure_array_type().map_err(|_| ErrorCode::BindError("array_flatten expects `any[][]` input".into()))?;
344 let return_type = input.return_type().into_list_elem();
345 if !return_type.is_array() {
346 return Err(ErrorCode::BindError("array_flatten expects `any[][]` input".into()).into());
347 }
348 Ok(FunctionCall::new_unchecked(ExprType::ArrayFlatten, vec![input], return_type).into())
349 })),
350 ("trim_array", raw_call(ExprType::TrimArray)),
351 (
352 "array_ndims",
353 guard_by_len(|_binder, [input]| {
354 input.ensure_array_type()?;
355
356 let n = input.return_type().array_ndims()
357 .try_into().map_err(|_| ErrorCode::BindError("array_ndims integer overflow".into()))?;
358 Ok(ExprImpl::literal_int(n))
359 }),
360 ),
361 (
362 "array_lower",
363 guard_by_len(|binder, [arg0, arg1]| {
364 let ndims_expr = binder.bind_builtin_scalar_function("array_ndims", vec![arg0], false)?;
366 let arg1 = arg1.cast_implicit(&DataType::Int32)?;
367
368 FunctionCall::new(
369 ExprType::Case,
370 vec![
371 FunctionCall::new(
372 ExprType::And,
373 vec![
374 FunctionCall::new(ExprType::LessThan, vec![ExprImpl::literal_int(0), arg1.clone()])?.into(),
375 FunctionCall::new(ExprType::LessThanOrEqual, vec![arg1, ndims_expr])?.into(),
376 ],
377 )?.into(),
378 ExprImpl::literal_int(1),
379 ],
380 ).map(Into::into)
381 }),
382 ),
383 ("array_upper", raw_call(ExprType::ArrayLength)), ("array_dims", raw_call(ExprType::ArrayDims)),
385 ("hex_to_int256", raw_call(ExprType::HexToInt256)),
387 ("jsonb_object_field", raw_call(ExprType::JsonbAccess)),
389 ("jsonb_array_element", raw_call(ExprType::JsonbAccess)),
390 ("jsonb_object_field_text", raw_call(ExprType::JsonbAccessStr)),
391 ("jsonb_array_element_text", raw_call(ExprType::JsonbAccessStr)),
392 ("jsonb_extract_path", raw_call(ExprType::JsonbExtractPath)),
393 ("jsonb_extract_path_text", raw_call(ExprType::JsonbExtractPathText)),
394 ("jsonb_typeof", raw_call(ExprType::JsonbTypeof)),
395 ("jsonb_array_length", raw_call(ExprType::JsonbArrayLength)),
396 ("jsonb_concat", raw_call(ExprType::JsonbConcat)),
397 ("jsonb_object", raw_call(ExprType::JsonbObject)),
398 ("jsonb_pretty", raw_call(ExprType::JsonbPretty)),
399 ("jsonb_contains", raw_call(ExprType::JsonbContains)),
400 ("jsonb_contained", raw_call(ExprType::JsonbContained)),
401 ("jsonb_exists", raw_call(ExprType::JsonbExists)),
402 ("jsonb_exists_any", raw_call(ExprType::JsonbExistsAny)),
403 ("jsonb_exists_all", raw_call(ExprType::JsonbExistsAll)),
404 ("jsonb_delete", raw_call(ExprType::Subtract)),
405 ("jsonb_delete_path", raw_call(ExprType::JsonbDeletePath)),
406 ("jsonb_strip_nulls", raw_call(ExprType::JsonbStripNulls)),
407 ("to_jsonb", raw_call(ExprType::ToJsonb)),
408 ("jsonb_build_array", raw_call(ExprType::JsonbBuildArray)),
409 ("jsonb_build_object", raw_call(ExprType::JsonbBuildObject)),
410 ("jsonb_populate_record", raw_call(ExprType::JsonbPopulateRecord)),
411 ("jsonb_path_match", raw_call(ExprType::JsonbPathMatch)),
412 ("jsonb_path_exists", raw_call(ExprType::JsonbPathExists)),
413 ("jsonb_path_query_array", raw_call(ExprType::JsonbPathQueryArray)),
414 ("jsonb_path_query_first", raw_call(ExprType::JsonbPathQueryFirst)),
415 ("jsonb_set", raw_call(ExprType::JsonbSet)),
416 ("jsonb_populate_map", raw_call(ExprType::JsonbPopulateMap)),
417 ("jsonb_to_array", raw_call(ExprType::JsonbToArray)),
418 ("map_from_entries", raw_call(ExprType::MapFromEntries)),
420 ("map_access", raw_call(ExprType::MapAccess)),
421 ("map_keys", raw_call(ExprType::MapKeys)),
422 ("map_values", raw_call(ExprType::MapValues)),
423 ("map_entries", raw_call(ExprType::MapEntries)),
424 ("map_from_key_values", raw_call(ExprType::MapFromKeyValues)),
425 ("map_cat", raw_call(ExprType::MapCat)),
426 ("map_contains", raw_call(ExprType::MapContains)),
427 ("map_delete", raw_call(ExprType::MapDelete)),
428 ("map_insert", raw_call(ExprType::MapInsert)),
429 ("map_length", raw_call(ExprType::MapLength)),
430 ("l2_distance", raw_call(ExprType::L2Distance)),
432 ("cosine_distance", raw_call(ExprType::CosineDistance)),
433 ("l1_distance", raw_call(ExprType::L1Distance)),
434 ("inner_product", raw_call(ExprType::InnerProduct)),
435 ("vector_norm", raw_call(ExprType::L2Norm)),
436 ("l2_normalize", raw_call(ExprType::L2Normalize)),
437 ("subvector", guard_by_len(|_, [vector_expr, start_expr, len_expr]| {
438 let dimensions = if let DataType::Vector(length) = vector_expr.return_type() {
439 length as i32
440 } else {
441 return Err(ErrorCode::BindError("subvector expects `vector(dim)` input".into()).into());
442 };
443 let start = start_expr
444 .try_fold_const()
445 .transpose()?
446 .and_then(|datum| match datum {
447 Some(ScalarImpl::Int32(v)) => Some(v),
448 _ => None,
449 })
450 .ok_or_else(|| ErrorCode::ExprError("`start` must be an Int32 constant".into()))?;
451
452 let len = len_expr
453 .try_fold_const()
454 .transpose()?
455 .and_then(|datum| match datum {
456 Some(ScalarImpl::Int32(v)) => Some(v),
457 _ => None,
458 })
459 .ok_or_else(|| ErrorCode::ExprError("`count` must be an Int32 constant".into()))?;
460 if len < 1 || len > DataType::VEC_MAX_SIZE as i32 {
461 return Err(ErrorCode::InvalidParameterValue(format!("Invalid vector size: expected 1..={}, got {}", DataType::VEC_MAX_SIZE, len)).into());
462 }
463
464 let end = start + len - 1;
465
466 if start < 1 || end > dimensions {
467 return Err(ErrorCode::InvalidParameterValue(format!(
468 "vector slice range out of bounds: start={}, end={}, valid range is [1, {}]",
469 start,
470 end,
471 dimensions
472 )).into());
473 }
474
475 Ok(FunctionCall::new_unchecked(ExprType::Subvector, vec![vector_expr, start_expr, len_expr], DataType::Vector(len as usize)).into())
476 })),
477 ("pi", pi()),
479 ("greatest", raw_call(ExprType::Greatest)),
481 ("least", raw_call(ExprType::Least)),
482 (
484 "pg_typeof",
485 guard_by_len(|_binder, [input]| {
486 let v = match input.is_untyped() {
487 true => "unknown".into(),
488 false => input.return_type().to_string(),
489 };
490 Ok(ExprImpl::literal_varchar(v))
491 }),
492 ),
493 ("current_catalog", current_database()),
494 ("current_database", current_database()),
495 ("current_schema", guard_by_len(|binder, []| {
496 Ok(binder
497 .first_valid_schema()
498 .map(|schema| ExprImpl::literal_varchar(schema.name()))
499 .unwrap_or_else(|_| ExprImpl::literal_null(DataType::Varchar)))
500 })),
501 ("current_schemas", raw(|binder, mut inputs| {
502 let no_match_err = ErrorCode::ExprError(
503 "No function matches the given name and argument types. You might need to add explicit type casts.".into()
504 );
505 if inputs.len() != 1 {
506 return Err(no_match_err.into());
507 }
508 let input = inputs
509 .pop()
510 .unwrap()
511 .enforce_bool_clause("current_schemas")
512 .map_err(|_| no_match_err)?;
513
514 let ExprImpl::Literal(literal) = &input else {
515 bail_not_implemented!("Only boolean literals are supported in `current_schemas`.");
516 };
517
518 let Some(bool) = literal.get_data().as_ref().map(|bool| bool.clone().into_bool()) else {
519 return Ok(ExprImpl::literal_null(DataType::Varchar.list()));
520 };
521
522 let paths = if bool {
523 binder.search_path.path()
524 } else {
525 binder.search_path.real_path()
526 };
527
528 let mut schema_names = vec![];
529 for path in paths {
530 let mut schema_name = path;
531 if schema_name == USER_NAME_WILD_CARD {
532 schema_name = &binder.auth_context.user_name;
533 }
534
535 if binder
536 .catalog
537 .get_schema_by_name(&binder.db_name, schema_name)
538 .is_ok()
539 {
540 schema_names.push(schema_name.as_str());
541 }
542 }
543
544 Ok(ExprImpl::literal_list(
545 ListValue::from_iter(schema_names),
546 DataType::Varchar,
547 ))
548 })),
549 ("session_user", session_user()),
550 ("current_role", current_user()),
551 ("current_user", current_user()),
552 ("user", current_user()),
553 ("pg_get_userbyid", raw_call(ExprType::PgGetUserbyid)),
554 ("pg_get_indexdef", raw_call(ExprType::PgGetIndexdef)),
555 ("pg_get_viewdef", raw_call(ExprType::PgGetViewdef)),
556 ("pg_index_column_has_property", raw_call(ExprType::PgIndexColumnHasProperty)),
557 ("pg_relation_size", raw(|_binder, mut inputs| {
558 if inputs.is_empty() {
559 return Err(ErrorCode::ExprError(
560 "function pg_relation_size() does not exist".into(),
561 )
562 .into());
563 }
564 inputs[0].cast_to_regclass_mut()?;
565 Ok(FunctionCall::new(ExprType::PgRelationSize, inputs)?.into())
566 })),
567 ("pg_get_serial_sequence", raw_literal(ExprImpl::literal_null(DataType::Varchar))),
568 ("pg_table_size", guard_by_len(|_binder, [mut input]| {
569 input.cast_to_regclass_mut()?;
570 Ok(FunctionCall::new(ExprType::PgRelationSize, vec![input])?.into())
571 })),
572 ("pg_indexes_size", guard_by_len(|_binder, [mut input]| {
573 input.cast_to_regclass_mut()?;
574 Ok(FunctionCall::new(ExprType::PgIndexesSize, vec![input])?.into())
575 })),
576 ("pg_get_expr", raw(|_binder, inputs| {
577 if inputs.len() == 2 || inputs.len() == 3 {
578 Ok(ExprImpl::literal_varchar("".into()))
580 } else {
581 Err(ErrorCode::ExprError(
582 "Too many/few arguments for pg_catalog.pg_get_expr()".into(),
583 )
584 .into())
585 }
586 })),
587 ("pg_my_temp_schema", guard_by_len(|_binder, []| {
588 Ok(ExprImpl::literal_int(
590 0,
592 ))
593 })),
594 ("current_setting", guard_by_len(|binder, [input]| {
595 let input = if let ExprImpl::Literal(literal) = &input &&
596 let Some(ScalarImpl::Utf8(input)) = literal.get_data()
597 {
598 input
599 } else {
600 return Err(ErrorCode::ExprError(
601 "Only literal is supported in `setting_name`.".into(),
602 )
603 .into());
604 };
605 let session_config = binder.session_config.read();
606 Ok(ExprImpl::literal_varchar(session_config.get(input.as_ref())?))
607 })),
608 ("set_config", guard_by_len(|binder, [arg0, arg1, arg2]| {
609 let setting_name = if let ExprImpl::Literal(literal) = &arg0 && let Some(ScalarImpl::Utf8(input)) = literal.get_data() {
610 input
611 } else {
612 return Err(ErrorCode::ExprError(
613 "Only string literal is supported in `setting_name`.".into(),
614 )
615 .into());
616 };
617
618 let new_value = if let ExprImpl::Literal(literal) = &arg1 && let Some(ScalarImpl::Utf8(input)) = literal.get_data() {
619 input
620 } else {
621 return Err(ErrorCode::ExprError(
622 "Only string literal is supported in `setting_name`.".into(),
623 )
624 .into());
625 };
626
627 let is_local = if let ExprImpl::Literal(literal) = &arg2 && let Some(ScalarImpl::Bool(input)) = literal.get_data() {
628 input
629 } else {
630 return Err(ErrorCode::ExprError(
631 "Only bool literal is supported in `is_local`.".into(),
632 )
633 .into());
634 };
635
636 if *is_local {
637 return Err(ErrorCode::ExprError(
638 "`is_local = true` is not supported now.".into(),
639 )
640 .into());
641 }
642
643 let mut session_config = binder.session_config.write();
644
645 session_config.set(setting_name, new_value.to_string(), &mut ())?;
647
648 Ok(ExprImpl::literal_varchar(new_value.to_string()))
649 })),
650 ("format_type", raw_call(ExprType::FormatType)),
651 ("pg_table_is_visible", raw_call(ExprType::PgTableIsVisible)),
652 ("pg_type_is_visible", raw_literal(ExprImpl::literal_bool(true))),
653 ("pg_get_constraintdef", raw_literal(ExprImpl::literal_null(DataType::Varchar))),
654 ("pg_get_partkeydef", raw_literal(ExprImpl::literal_null(DataType::Varchar))),
655 ("pg_encoding_to_char", raw_literal(ExprImpl::literal_varchar("UTF8".into()))),
656 ("has_database_privilege", raw(|binder, mut inputs| {
657 if inputs.len() == 2 {
658 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
659 }
660 if inputs.len() == 3 {
661 Ok(FunctionCall::new(ExprType::HasDatabasePrivilege, inputs)?.into())
662 } else {
663 Err(ErrorCode::ExprError(
664 "Too many/few arguments for pg_catalog.has_database_privilege()".into(),
665 )
666 .into())
667 }
668 })),
669 ("has_table_privilege", raw(|binder, mut inputs| {
670 if inputs.len() == 2 {
671 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
672 }
673 if inputs.len() == 3 {
674 if inputs[1].return_type() == DataType::Varchar {
675 inputs[1].cast_to_regclass_mut()?;
676 }
677 Ok(FunctionCall::new(ExprType::HasTablePrivilege, inputs)?.into())
678 } else {
679 Err(ErrorCode::ExprError(
680 "Too many/few arguments for pg_catalog.has_table_privilege()".into(),
681 )
682 .into())
683 }
684 })),
685 ("has_any_column_privilege", raw(|binder, mut inputs| {
686 if inputs.len() == 2 {
687 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
688 }
689 if inputs.len() == 3 {
690 if inputs[1].return_type() == DataType::Varchar {
691 inputs[1].cast_to_regclass_mut()?;
692 }
693 Ok(FunctionCall::new(ExprType::HasAnyColumnPrivilege, inputs)?.into())
694 } else {
695 Err(ErrorCode::ExprError(
696 "Too many/few arguments for pg_catalog.has_any_column_privilege()".into(),
697 )
698 .into())
699 }
700 })),
701 ("has_schema_privilege", raw(|binder, mut inputs| {
702 if inputs.len() == 2 {
703 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
704 }
705 if inputs.len() == 3 {
706 Ok(FunctionCall::new(ExprType::HasSchemaPrivilege, inputs)?.into())
707 } else {
708 Err(ErrorCode::ExprError(
709 "Too many/few arguments for pg_catalog.has_schema_privilege()".into(),
710 )
711 .into())
712 }
713 })),
714 ("has_function_privilege", raw(|binder, mut inputs| {
715 if inputs.len() == 2 {
716 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
717 }
718 if inputs.len() == 3 {
719 Ok(FunctionCall::new(ExprType::HasFunctionPrivilege, inputs)?.into())
720 } else {
721 Err(ErrorCode::ExprError(
722 "Too many/few arguments for pg_catalog.has_function_privilege()".into(),
723 )
724 .into())
725 }
726 })),
727 ("pg_stat_get_numscans", raw_literal(ExprImpl::literal_bigint(0))),
728 ("pg_backend_pid", raw(|binder, _inputs| {
729 Ok(ExprImpl::literal_int(binder.session_id.0))
731 })),
732 ("pg_cancel_backend", guard_by_len(|_binder, [_input]| {
733 Ok(ExprImpl::literal_bool(false))
735 })),
736 ("pg_terminate_backend", guard_by_len(|_binder, [_input]| {
737 Ok(ExprImpl::literal_bool(false))
740 })),
741 ("pg_tablespace_location", guard_by_len(|_binder, [_input]| {
742 Ok(ExprImpl::literal_null(DataType::Varchar))
743 })),
744 ("pg_postmaster_start_time", guard_by_len(|_binder, []| {
745 let server_start_time = risingwave_variables::get_server_start_time();
746 let datum = server_start_time.map(Timestamptz::from).map(ScalarImpl::from);
747 let literal = Literal::new(datum, DataType::Timestamptz);
748 Ok(literal.into())
749 })),
750 ("col_description", raw_call(ExprType::ColDescription)),
754 ("obj_description", raw_literal(ExprImpl::literal_varchar("".to_owned()))),
755 ("shobj_description", raw_literal(ExprImpl::literal_varchar("".to_owned()))),
756 ("pg_is_in_recovery", raw_call(ExprType::PgIsInRecovery)),
757 ("rw_recovery_status", raw_call(ExprType::RwRecoveryStatus)),
758 ("rw_epoch_to_ts", raw_call(ExprType::RwEpochToTs)),
759 ("rw_vnode", raw_call(ExprType::VnodeUser)),
761 ("rw_license", raw_call(ExprType::License)),
762 ("rw_test_paid_tier", raw_call(ExprType::TestFeature)), ("rw_test_feature", raw_call(ExprType::TestFeature)), ("version", raw_literal(ExprImpl::literal_varchar(current_cluster_version()))),
766 ("now", now()),
768 ("current_timestamp", now()),
769 ("proctime", proctime()),
770 ("pg_sleep", raw_call(ExprType::PgSleep)),
771 ("pg_sleep_for", raw_call(ExprType::PgSleepFor)),
772 ("random", raw_call(ExprType::Random)),
773 ("date", guard_by_len(|_binder, [input]| {
779 input.cast_explicit(&DataType::Date).map_err(Into::into)
780 })),
781
782 ("openai_embedding", guard_by_len(|_binder, [arg0, arg1]| {
784 if let ExprImpl::Literal(config) = &arg0 && let Some(ScalarImpl::Jsonb(_config)) = config.get_data() {
786 Ok(FunctionCall::new(ExprType::OpenaiEmbedding, vec![arg0, arg1])?.into())
787 } else {
788 Err(ErrorCode::InvalidInputSyntax(
789 "`embedding_config` must be constant jsonb".to_owned(),
790 ).into())
791 }
792 })),
793 ]
794 .into_iter()
795 .collect()
796 });
797
798 static FUNCTIONS_BKTREE: LazyLock<BKTree<&str>> = LazyLock::new(|| {
799 let mut tree = BKTree::new(metrics::Levenshtein);
800
801 for k in HANDLES.keys() {
803 tree.add(*k);
804 }
805
806 tree
807 });
808
809 if variadic {
810 let func = match function_name {
811 "format" => ExprType::FormatVariadic,
812 "concat" => ExprType::ConcatVariadic,
813 "concat_ws" => ExprType::ConcatWsVariadic,
814 "jsonb_build_array" => ExprType::JsonbBuildArrayVariadic,
815 "jsonb_build_object" => ExprType::JsonbBuildObjectVariadic,
816 "jsonb_extract_path" => ExprType::JsonbExtractPathVariadic,
817 "jsonb_extract_path_text" => ExprType::JsonbExtractPathTextVariadic,
818 _ => {
819 return Err(ErrorCode::BindError(format!(
820 "VARIADIC argument is not allowed in function \"{}\"",
821 function_name
822 ))
823 .into());
824 }
825 };
826 return Ok(FunctionCall::new(func, inputs)?.into());
827 }
828
829 match HANDLES.get(function_name) {
831 Some(handle) => handle(self, inputs),
832 None => {
833 let allowed_distance = if function_name.len() > 3 { 2 } else { 1 };
834
835 let candidates = FUNCTIONS_BKTREE
836 .find(function_name, allowed_distance)
837 .map(|(_idx, c)| c)
838 .join(" or ");
839
840 Err(no_function!(
841 candidates = (!candidates.is_empty()).then_some(candidates),
842 "{}({})",
843 function_name,
844 inputs.iter().map(|e| e.return_type()).join(", ")
845 )
846 .into())
847 }
848 }
849 }
850
851 fn ensure_now_function_allowed(&self) -> Result<()> {
852 if self.is_for_stream()
853 && !matches!(
854 self.context.clause,
855 Some(Clause::Where)
856 | Some(Clause::Having)
857 | Some(Clause::JoinOn)
858 | Some(Clause::From)
859 )
860 {
861 return Err(ErrorCode::InvalidInputSyntax(format!(
862 "For streaming queries, `NOW()` function is only allowed in `WHERE`, `HAVING`, `ON` and `FROM`. Found in clause: {:?}. \
863 Please please refer to https://www.risingwave.dev/docs/current/sql-pattern-temporal-filters/ for more information",
864 self.context.clause
865 ))
866 .into());
867 }
868 if matches!(self.context.clause, Some(Clause::GeneratedColumn)) {
869 return Err(ErrorCode::InvalidInputSyntax(
870 "Cannot use `NOW()` function in generated columns. Do you want `PROCTIME()`?"
871 .to_owned(),
872 )
873 .into());
874 }
875 Ok(())
876 }
877
878 fn ensure_proctime_function_allowed(&self) -> Result<()> {
879 if !self.is_for_ddl() {
880 return Err(ErrorCode::InvalidInputSyntax(
881 "Function `PROCTIME()` is only allowed in CREATE TABLE/SOURCE. Is `NOW()` what you want?".to_owned(),
882 )
883 .into());
884 }
885 Ok(())
886 }
887}
888
889fn rewrite_concat_to_concat_ws(inputs: Vec<ExprImpl>) -> Result<Vec<ExprImpl>> {
890 if inputs.is_empty() {
891 Err(ErrorCode::BindError(
892 "Function `concat` takes at least 1 arguments (0 given)".to_owned(),
893 )
894 .into())
895 } else {
896 let inputs = std::iter::once(ExprImpl::literal_varchar("".to_owned()))
897 .chain(inputs)
898 .collect();
899 Ok(inputs)
900 }
901}
902
903fn rewrite_nullif_to_case_when(inputs: Vec<ExprImpl>) -> Result<Vec<ExprImpl>> {
906 if inputs.len() != 2 {
907 Err(ErrorCode::BindError("Function `nullif` must contain 2 arguments".to_owned()).into())
908 } else {
909 let inputs = vec![
910 FunctionCall::new(ExprType::Equal, inputs.clone())?.into(),
911 Literal::new(None, inputs[0].return_type()).into(),
912 inputs[0].clone(),
913 ];
914 Ok(inputs)
915 }
916}
917
918fn rewrite_two_bool_inputs(mut inputs: Vec<ExprImpl>) -> Result<Vec<ExprImpl>> {
919 if inputs.len() != 2 {
920 return Err(
921 ErrorCode::BindError("function must contain only 2 arguments".to_owned()).into(),
922 );
923 }
924 let left = inputs.pop().unwrap();
925 let right = inputs.pop().unwrap();
926 Ok(vec![
927 left.cast_implicit(&DataType::Boolean)?,
928 right.cast_implicit(&DataType::Boolean)?,
929 ])
930}