1use std::collections::HashMap;
16use std::sync::LazyLock;
17
18use bk_tree::{BKTree, metrics};
19use itertools::Itertools;
20use risingwave_common::session_config::USER_NAME_WILD_CARD;
21use risingwave_common::types::{DataType, ListValue, ScalarImpl, Timestamptz};
22use risingwave_common::{bail_not_implemented, current_cluster_version, no_function};
23use thiserror_ext::AsReport;
24
25use crate::Binder;
26use crate::binder::Clause;
27use crate::error::{ErrorCode, Result};
28use crate::expr::{CastContext, Expr, ExprImpl, ExprType, FunctionCall, Literal, Now};
29
30impl Binder {
31 pub(super) fn bind_builtin_scalar_function(
32 &mut self,
33 function_name: &str,
34 inputs: Vec<ExprImpl>,
35 variadic: bool,
36 ) -> Result<ExprImpl> {
37 type Inputs = Vec<ExprImpl>;
38
39 type Handle = Box<dyn Fn(&mut Binder, Inputs) -> Result<ExprImpl> + Sync + Send>;
40
41 fn rewrite(r#type: ExprType, rewriter: fn(Inputs) -> Result<Inputs>) -> Handle {
42 Box::new(move |_binder, mut inputs| {
43 inputs = (rewriter)(inputs)?;
44 Ok(FunctionCall::new(r#type, inputs)?.into())
45 })
46 }
47
48 fn raw_call(r#type: ExprType) -> Handle {
49 rewrite(r#type, Ok)
50 }
51
52 fn guard_by_len<const E: usize>(
53 handle: impl Fn(&mut Binder, [ExprImpl; E]) -> Result<ExprImpl> + Sync + Send + 'static,
54 ) -> Handle {
55 Box::new(move |binder, inputs| {
56 let input_len = inputs.len();
57 let Ok(inputs) = inputs.try_into() else {
58 return Err(ErrorCode::ExprError(
59 format!("unexpected arguments number {}, expect {}", input_len, E).into(),
60 )
61 .into());
62 };
63 handle(binder, inputs)
64 })
65 }
66
67 fn raw<F: Fn(&mut Binder, Inputs) -> Result<ExprImpl> + Sync + Send + 'static>(
68 f: F,
69 ) -> Handle {
70 Box::new(f)
71 }
72
73 fn dispatch_by_len(mapping: Vec<(usize, Handle)>) -> Handle {
74 Box::new(move |binder, inputs| {
75 for (len, handle) in &mapping {
76 if inputs.len() == *len {
77 return handle(binder, inputs);
78 }
79 }
80 Err(ErrorCode::ExprError("unexpected arguments number".into()).into())
81 })
82 }
83
84 fn raw_literal(literal: ExprImpl) -> Handle {
85 Box::new(move |_binder, _inputs| Ok(literal.clone()))
86 }
87
88 fn now() -> Handle {
89 guard_by_len(move |binder, []| {
90 binder.ensure_now_function_allowed()?;
91 Ok(Now.into())
94 })
95 }
96
97 fn pi() -> Handle {
98 raw_literal(ExprImpl::literal_f64(std::f64::consts::PI))
99 }
100
101 fn proctime() -> Handle {
102 Box::new(move |binder, inputs| {
103 binder.ensure_proctime_function_allowed()?;
104 raw_call(ExprType::Proctime)(binder, inputs)
105 })
106 }
107
108 fn session_user() -> Handle {
110 guard_by_len(|binder, []| {
111 Ok(ExprImpl::literal_varchar(
112 binder.auth_context.user_name.clone(),
113 ))
114 })
115 }
116
117 fn current_user() -> Handle {
121 guard_by_len(|binder, []| {
122 Ok(ExprImpl::literal_varchar(
123 binder.auth_context.user_name.clone(),
124 ))
125 })
126 }
127
128 fn current_database() -> Handle {
131 guard_by_len(|binder, []| Ok(ExprImpl::literal_varchar(binder.db_name.clone())))
132 }
133
134 static HANDLES: LazyLock<HashMap<&'static str, Handle>> = LazyLock::new(|| {
138 [
139 (
140 "booleq",
141 rewrite(ExprType::Equal, rewrite_two_bool_inputs),
142 ),
143 (
144 "boolne",
145 rewrite(ExprType::NotEqual, rewrite_two_bool_inputs),
146 ),
147 ("coalesce", rewrite(ExprType::Coalesce, |inputs| {
148 if inputs.iter().any(ExprImpl::has_table_function) {
149 return Err(ErrorCode::BindError("table functions are not allowed in COALESCE".into()).into());
150 }
151 Ok(inputs)
152 })),
153 (
154 "nullif",
155 rewrite(ExprType::Case, rewrite_nullif_to_case_when),
156 ),
157 (
158 "round",
159 dispatch_by_len(vec![
160 (2, raw_call(ExprType::RoundDigit)),
161 (1, raw_call(ExprType::Round)),
162 ]),
163 ),
164 ("pow", raw_call(ExprType::Pow)),
165 ("power", raw_call(ExprType::Pow)),
167 ("ceil", raw_call(ExprType::Ceil)),
168 ("ceiling", raw_call(ExprType::Ceil)),
169 ("floor", raw_call(ExprType::Floor)),
170 ("trunc", raw_call(ExprType::Trunc)),
171 ("abs", raw_call(ExprType::Abs)),
172 ("exp", raw_call(ExprType::Exp)),
173 ("ln", raw_call(ExprType::Ln)),
174 ("log", raw_call(ExprType::Log10)),
175 ("log10", raw_call(ExprType::Log10)),
176 ("mod", raw_call(ExprType::Modulus)),
177 ("sin", raw_call(ExprType::Sin)),
178 ("cos", raw_call(ExprType::Cos)),
179 ("tan", raw_call(ExprType::Tan)),
180 ("cot", raw_call(ExprType::Cot)),
181 ("asin", raw_call(ExprType::Asin)),
182 ("acos", raw_call(ExprType::Acos)),
183 ("atan", raw_call(ExprType::Atan)),
184 ("atan2", raw_call(ExprType::Atan2)),
185 ("sind", raw_call(ExprType::Sind)),
186 ("cosd", raw_call(ExprType::Cosd)),
187 ("cotd", raw_call(ExprType::Cotd)),
188 ("tand", raw_call(ExprType::Tand)),
189 ("sinh", raw_call(ExprType::Sinh)),
190 ("cosh", raw_call(ExprType::Cosh)),
191 ("tanh", raw_call(ExprType::Tanh)),
192 ("coth", raw_call(ExprType::Coth)),
193 ("asinh", raw_call(ExprType::Asinh)),
194 ("acosh", raw_call(ExprType::Acosh)),
195 ("atanh", raw_call(ExprType::Atanh)),
196 ("asind", raw_call(ExprType::Asind)),
197 ("acosd", raw_call(ExprType::Acosd)),
198 ("atand", raw_call(ExprType::Atand)),
199 ("atan2d", raw_call(ExprType::Atan2d)),
200 ("degrees", raw_call(ExprType::Degrees)),
201 ("radians", raw_call(ExprType::Radians)),
202 ("sqrt", raw_call(ExprType::Sqrt)),
203 ("cbrt", raw_call(ExprType::Cbrt)),
204 ("sign", raw_call(ExprType::Sign)),
205 ("scale", raw_call(ExprType::Scale)),
206 ("min_scale", raw_call(ExprType::MinScale)),
207 ("trim_scale", raw_call(ExprType::TrimScale)),
208 (
210 "to_timestamp",
211 dispatch_by_len(vec![
212 (1, raw_call(ExprType::SecToTimestamptz)),
213 (2, raw_call(ExprType::CharToTimestamptz)),
214 ]),
215 ),
216 ("date_trunc", raw_call(ExprType::DateTrunc)),
217 ("date_bin", raw_call(ExprType::DateBin)),
218 ("date_part", raw_call(ExprType::DatePart)),
219 ("make_date", raw_call(ExprType::MakeDate)),
220 ("make_time", raw_call(ExprType::MakeTime)),
221 ("make_timestamp", raw_call(ExprType::MakeTimestamp)),
222 ("make_timestamptz", raw_call(ExprType::MakeTimestamptz)),
223 ("timezone", guard_by_len(|_binder, [arg0, arg1]| {
224 Ok(FunctionCall::new(ExprType::AtTimeZone, vec![arg1, arg0])?.into())
226 })),
227 ("to_date", raw_call(ExprType::CharToDate)),
228 ("substr", raw_call(ExprType::Substr)),
230 ("length", raw_call(ExprType::Length)),
231 ("upper", raw_call(ExprType::Upper)),
232 ("lower", raw_call(ExprType::Lower)),
233 ("trim", raw_call(ExprType::Trim)),
234 ("replace", raw_call(ExprType::Replace)),
235 ("overlay", raw_call(ExprType::Overlay)),
236 ("btrim", raw_call(ExprType::Trim)),
237 ("ltrim", raw_call(ExprType::Ltrim)),
238 ("rtrim", raw_call(ExprType::Rtrim)),
239 ("md5", raw_call(ExprType::Md5)),
240 ("to_char", raw_call(ExprType::ToChar)),
241 (
242 "concat",
243 rewrite(ExprType::ConcatWs, rewrite_concat_to_concat_ws),
244 ),
245 ("concat_ws", raw_call(ExprType::ConcatWs)),
246 ("format", raw_call(ExprType::Format)),
247 ("translate", raw_call(ExprType::Translate)),
248 ("split_part", raw_call(ExprType::SplitPart)),
249 ("char_length", raw_call(ExprType::CharLength)),
250 ("character_length", raw_call(ExprType::CharLength)),
251 ("repeat", raw_call(ExprType::Repeat)),
252 ("ascii", raw_call(ExprType::Ascii)),
253 ("octet_length", raw_call(ExprType::OctetLength)),
254 ("bit_length", raw_call(ExprType::BitLength)),
255 ("regexp_match", raw_call(ExprType::RegexpMatch)),
256 ("regexp_replace", raw_call(ExprType::RegexpReplace)),
257 ("regexp_count", raw_call(ExprType::RegexpCount)),
258 ("regexp_split_to_array", raw_call(ExprType::RegexpSplitToArray)),
259 ("chr", raw_call(ExprType::Chr)),
260 ("starts_with", raw_call(ExprType::StartsWith)),
261 ("initcap", raw_call(ExprType::Initcap)),
262 ("lpad", raw_call(ExprType::Lpad)),
263 ("rpad", raw_call(ExprType::Rpad)),
264 ("reverse", raw_call(ExprType::Reverse)),
265 ("strpos", raw_call(ExprType::Position)),
266 ("to_ascii", raw_call(ExprType::ToAscii)),
267 ("to_hex", raw_call(ExprType::ToHex)),
268 ("quote_ident", raw_call(ExprType::QuoteIdent)),
269 ("quote_literal", guard_by_len(|_binder, [mut input]| {
270 if input.return_type() != DataType::Varchar {
271 FunctionCall::cast_mut(&mut input, &DataType::Varchar, CastContext::Explicit)?;
274 }
275 Ok(FunctionCall::new_unchecked(ExprType::QuoteLiteral, vec![input], DataType::Varchar).into())
276 })),
277 ("quote_nullable", guard_by_len(|_binder, [mut input]| {
278 if input.return_type() != DataType::Varchar {
279 FunctionCall::cast_mut(&mut input, &DataType::Varchar, CastContext::Explicit)?;
282 }
283 Ok(FunctionCall::new_unchecked(ExprType::QuoteNullable, vec![input], DataType::Varchar).into())
284 })),
285 ("string_to_array", raw_call(ExprType::StringToArray)),
286 ("get_bit", raw_call(ExprType::GetBit)),
287 ("get_byte", raw_call(ExprType::GetByte)),
288 ("set_bit", raw_call(ExprType::SetBit)),
289 ("set_byte", raw_call(ExprType::SetByte)),
290 ("bit_count", raw_call(ExprType::BitCount)),
291 ("encode", raw_call(ExprType::Encode)),
292 ("decode", raw_call(ExprType::Decode)),
293 ("convert_from", raw_call(ExprType::ConvertFrom)),
294 ("convert_to", raw_call(ExprType::ConvertTo)),
295 ("sha1", raw_call(ExprType::Sha1)),
296 ("sha224", raw_call(ExprType::Sha224)),
297 ("sha256", raw_call(ExprType::Sha256)),
298 ("sha384", raw_call(ExprType::Sha384)),
299 ("sha512", raw_call(ExprType::Sha512)),
300 ("encrypt", raw_call(ExprType::Encrypt)),
301 ("decrypt", raw_call(ExprType::Decrypt)),
302 ("hmac", raw_call(ExprType::Hmac)),
303 ("secure_compare", raw_call(ExprType::SecureCompare)),
304 ("left", raw_call(ExprType::Left)),
305 ("right", raw_call(ExprType::Right)),
306 ("inet_aton", raw_call(ExprType::InetAton)),
307 ("inet_ntoa", raw_call(ExprType::InetNtoa)),
308 ("int8send", raw_call(ExprType::PgwireSend)),
309 ("int8recv", guard_by_len(|_binder, [mut input]| {
310 let hint = if !input.is_untyped() && input.return_type() == DataType::Varchar {
312 " Consider `decode` or cast."
313 } else {
314 ""
315 };
316 input.cast_implicit_mut(&DataType::Bytea).map_err(|e| {
317 ErrorCode::BindError(format!("{} in `recv`.{hint}", e.as_report()))
318 })?;
319 Ok(FunctionCall::new_unchecked(ExprType::PgwireRecv, vec![input], DataType::Int64).into())
320 })),
321 ("array_cat", raw_call(ExprType::ArrayCat)),
323 ("array_append", raw_call(ExprType::ArrayAppend)),
324 ("array_join", raw_call(ExprType::ArrayToString)),
325 ("array_prepend", raw_call(ExprType::ArrayPrepend)),
326 ("array_to_string", raw_call(ExprType::ArrayToString)),
327 ("array_distinct", raw_call(ExprType::ArrayDistinct)),
328 ("array_min", raw_call(ExprType::ArrayMin)),
329 ("array_sort", raw_call(ExprType::ArraySort)),
330 ("array_length", raw_call(ExprType::ArrayLength)),
331 ("cardinality", raw_call(ExprType::Cardinality)),
332 ("array_remove", raw_call(ExprType::ArrayRemove)),
333 ("array_replace", raw_call(ExprType::ArrayReplace)),
334 ("array_reverse", raw_call(ExprType::ArrayReverse)),
335 ("array_max", raw_call(ExprType::ArrayMax)),
336 ("array_sum", raw_call(ExprType::ArraySum)),
337 ("array_position", raw_call(ExprType::ArrayPosition)),
338 ("array_positions", raw_call(ExprType::ArrayPositions)),
339 ("array_contains", raw_call(ExprType::ArrayContains)),
340 ("arraycontains", raw_call(ExprType::ArrayContains)),
341 ("array_contained", raw_call(ExprType::ArrayContained)),
342 ("arraycontained", raw_call(ExprType::ArrayContained)),
343 ("array_flatten", guard_by_len(|_binder, [input]| {
344 input.ensure_array_type().map_err(|_| ErrorCode::BindError("array_flatten expects `any[][]` input".into()))?;
345 let return_type = input.return_type().into_list_elem();
346 if !return_type.is_array() {
347 return Err(ErrorCode::BindError("array_flatten expects `any[][]` input".into()).into());
348 }
349 Ok(FunctionCall::new_unchecked(ExprType::ArrayFlatten, vec![input], return_type).into())
350 })),
351 ("trim_array", raw_call(ExprType::TrimArray)),
352 (
353 "array_ndims",
354 guard_by_len(|_binder, [input]| {
355 input.ensure_array_type()?;
356
357 let n = input.return_type().array_ndims()
358 .try_into().map_err(|_| ErrorCode::BindError("array_ndims integer overflow".into()))?;
359 Ok(ExprImpl::literal_int(n))
360 }),
361 ),
362 (
363 "array_lower",
364 guard_by_len(|binder, [arg0, arg1]| {
365 let ndims_expr = binder.bind_builtin_scalar_function("array_ndims", vec![arg0], false)?;
367 let arg1 = arg1.cast_implicit(&DataType::Int32)?;
368
369 FunctionCall::new(
370 ExprType::Case,
371 vec![
372 FunctionCall::new(
373 ExprType::And,
374 vec![
375 FunctionCall::new(ExprType::LessThan, vec![ExprImpl::literal_int(0), arg1.clone()])?.into(),
376 FunctionCall::new(ExprType::LessThanOrEqual, vec![arg1, ndims_expr])?.into(),
377 ],
378 )?.into(),
379 ExprImpl::literal_int(1),
380 ],
381 ).map(Into::into)
382 }),
383 ),
384 ("array_upper", raw_call(ExprType::ArrayLength)), ("array_dims", raw_call(ExprType::ArrayDims)),
386 ("hex_to_int256", raw_call(ExprType::HexToInt256)),
388 ("jsonb_object_field", raw_call(ExprType::JsonbAccess)),
390 ("jsonb_array_element", raw_call(ExprType::JsonbAccess)),
391 ("jsonb_object_field_text", raw_call(ExprType::JsonbAccessStr)),
392 ("jsonb_array_element_text", raw_call(ExprType::JsonbAccessStr)),
393 ("jsonb_extract_path", raw_call(ExprType::JsonbExtractPath)),
394 ("jsonb_extract_path_text", raw_call(ExprType::JsonbExtractPathText)),
395 ("jsonb_typeof", raw_call(ExprType::JsonbTypeof)),
396 ("jsonb_array_length", raw_call(ExprType::JsonbArrayLength)),
397 ("jsonb_concat", raw_call(ExprType::JsonbConcat)),
398 ("jsonb_object", raw_call(ExprType::JsonbObject)),
399 ("jsonb_pretty", raw_call(ExprType::JsonbPretty)),
400 ("jsonb_contains", raw_call(ExprType::JsonbContains)),
401 ("jsonb_contained", raw_call(ExprType::JsonbContained)),
402 ("jsonb_exists", raw_call(ExprType::JsonbExists)),
403 ("jsonb_exists_any", raw_call(ExprType::JsonbExistsAny)),
404 ("jsonb_exists_all", raw_call(ExprType::JsonbExistsAll)),
405 ("jsonb_delete", raw_call(ExprType::Subtract)),
406 ("jsonb_delete_path", raw_call(ExprType::JsonbDeletePath)),
407 ("jsonb_strip_nulls", raw_call(ExprType::JsonbStripNulls)),
408 ("to_jsonb", raw_call(ExprType::ToJsonb)),
409 ("jsonb_build_array", raw_call(ExprType::JsonbBuildArray)),
410 ("jsonb_build_object", raw_call(ExprType::JsonbBuildObject)),
411 ("jsonb_populate_record", raw_call(ExprType::JsonbPopulateRecord)),
412 ("jsonb_path_match", raw_call(ExprType::JsonbPathMatch)),
413 ("jsonb_path_exists", raw_call(ExprType::JsonbPathExists)),
414 ("jsonb_path_query_array", raw_call(ExprType::JsonbPathQueryArray)),
415 ("jsonb_path_query_first", raw_call(ExprType::JsonbPathQueryFirst)),
416 ("jsonb_set", raw_call(ExprType::JsonbSet)),
417 ("jsonb_populate_map", raw_call(ExprType::JsonbPopulateMap)),
418 ("jsonb_to_array", raw_call(ExprType::JsonbToArray)),
419 ("map_from_entries", raw_call(ExprType::MapFromEntries)),
421 ("map_access", raw_call(ExprType::MapAccess)),
422 ("map_keys", raw_call(ExprType::MapKeys)),
423 ("map_values", raw_call(ExprType::MapValues)),
424 ("map_entries", raw_call(ExprType::MapEntries)),
425 ("map_from_key_values", raw_call(ExprType::MapFromKeyValues)),
426 ("map_cat", raw_call(ExprType::MapCat)),
427 ("map_contains", raw_call(ExprType::MapContains)),
428 ("map_delete", raw_call(ExprType::MapDelete)),
429 ("map_insert", raw_call(ExprType::MapInsert)),
430 ("map_length", raw_call(ExprType::MapLength)),
431 ("l2_distance", raw_call(ExprType::L2Distance)),
433 ("cosine_distance", raw_call(ExprType::CosineDistance)),
434 ("l1_distance", raw_call(ExprType::L1Distance)),
435 ("inner_product", raw_call(ExprType::InnerProduct)),
436 ("vector_norm", raw_call(ExprType::L2Norm)),
437 ("l2_normalize", raw_call(ExprType::L2Normalize)),
438 ("subvector", guard_by_len(|_, [vector_expr, start_expr, len_expr]| {
439 let dimensions = if let DataType::Vector(length) = vector_expr.return_type() {
440 length as i32
441 } else {
442 return Err(ErrorCode::BindError("subvector expects `vector(dim)` input".into()).into());
443 };
444 let start = start_expr
445 .try_fold_const()
446 .transpose()?
447 .and_then(|datum| match datum {
448 Some(ScalarImpl::Int32(v)) => Some(v),
449 _ => None,
450 })
451 .ok_or_else(|| ErrorCode::ExprError("`start` must be an Int32 constant".into()))?;
452
453 let len = len_expr
454 .try_fold_const()
455 .transpose()?
456 .and_then(|datum| match datum {
457 Some(ScalarImpl::Int32(v)) => Some(v),
458 _ => None,
459 })
460 .ok_or_else(|| ErrorCode::ExprError("`count` must be an Int32 constant".into()))?;
461 if len < 1 || len > DataType::VEC_MAX_SIZE as i32 {
462 return Err(ErrorCode::InvalidParameterValue(format!("Invalid vector size: expected 1..={}, got {}", DataType::VEC_MAX_SIZE, len)).into());
463 }
464
465 let end = start + len - 1;
466
467 if start < 1 || end > dimensions {
468 return Err(ErrorCode::InvalidParameterValue(format!(
469 "vector slice range out of bounds: start={}, end={}, valid range is [1, {}]",
470 start,
471 end,
472 dimensions
473 )).into());
474 }
475
476 Ok(FunctionCall::new_unchecked(ExprType::Subvector, vec![vector_expr, start_expr, len_expr], DataType::Vector(len as usize)).into())
477 })),
478 ("pi", pi()),
480 ("greatest", raw_call(ExprType::Greatest)),
482 ("least", raw_call(ExprType::Least)),
483 (
485 "pg_typeof",
486 guard_by_len(|_binder, [input]| {
487 let v = match input.is_untyped() {
488 true => "unknown".into(),
489 false => input.return_type().to_string(),
490 };
491 Ok(ExprImpl::literal_varchar(v))
492 }),
493 ),
494 ("current_catalog", current_database()),
495 ("current_database", current_database()),
496 ("current_schema", guard_by_len(|binder, []| {
497 Ok(binder
498 .first_valid_schema()
499 .map(|schema| ExprImpl::literal_varchar(schema.name()))
500 .unwrap_or_else(|_| ExprImpl::literal_null(DataType::Varchar)))
501 })),
502 ("current_schemas", raw(|binder, mut inputs| {
503 let no_match_err = ErrorCode::ExprError(
504 "No function matches the given name and argument types. You might need to add explicit type casts.".into()
505 );
506 if inputs.len() != 1 {
507 return Err(no_match_err.into());
508 }
509 let input = inputs
510 .pop()
511 .unwrap()
512 .enforce_bool_clause("current_schemas")
513 .map_err(|_| no_match_err)?;
514
515 let ExprImpl::Literal(literal) = &input else {
516 bail_not_implemented!("Only boolean literals are supported in `current_schemas`.");
517 };
518
519 let Some(bool) = literal.get_data().as_ref().map(|bool| bool.clone().into_bool()) else {
520 return Ok(ExprImpl::literal_null(DataType::Varchar.list()));
521 };
522
523 let paths = if bool {
524 binder.search_path.path()
525 } else {
526 binder.search_path.real_path()
527 };
528
529 let mut schema_names = vec![];
530 for path in paths {
531 let mut schema_name = path;
532 if schema_name == USER_NAME_WILD_CARD {
533 schema_name = &binder.auth_context.user_name;
534 }
535
536 if binder
537 .catalog
538 .get_schema_by_name(&binder.db_name, schema_name)
539 .is_ok()
540 {
541 schema_names.push(schema_name.as_str());
542 }
543 }
544
545 Ok(ExprImpl::literal_list(
546 ListValue::from_iter(schema_names),
547 DataType::Varchar,
548 ))
549 })),
550 ("session_user", session_user()),
551 ("current_role", current_user()),
552 ("current_user", current_user()),
553 ("user", current_user()),
554 ("pg_get_userbyid", raw_call(ExprType::PgGetUserbyid)),
555 ("pg_get_indexdef", raw_call(ExprType::PgGetIndexdef)),
556 ("pg_get_viewdef", raw_call(ExprType::PgGetViewdef)),
557 ("pg_index_column_has_property", raw_call(ExprType::PgIndexColumnHasProperty)),
558 ("pg_relation_size", raw(|_binder, mut inputs| {
559 if inputs.is_empty() {
560 return Err(ErrorCode::ExprError(
561 "function pg_relation_size() does not exist".into(),
562 )
563 .into());
564 }
565 inputs[0].cast_to_regclass_mut()?;
566 Ok(FunctionCall::new(ExprType::PgRelationSize, inputs)?.into())
567 })),
568 ("pg_get_serial_sequence", raw_literal(ExprImpl::literal_null(DataType::Varchar))),
569 ("pg_table_size", guard_by_len(|_binder, [mut input]| {
570 input.cast_to_regclass_mut()?;
571 Ok(FunctionCall::new(ExprType::PgRelationSize, vec![input])?.into())
572 })),
573 ("pg_indexes_size", guard_by_len(|_binder, [mut input]| {
574 input.cast_to_regclass_mut()?;
575 Ok(FunctionCall::new(ExprType::PgIndexesSize, vec![input])?.into())
576 })),
577 ("pg_get_expr", raw(|_binder, inputs| {
578 if inputs.len() == 2 || inputs.len() == 3 {
579 Ok(ExprImpl::literal_varchar("".into()))
581 } else {
582 Err(ErrorCode::ExprError(
583 "Too many/few arguments for pg_catalog.pg_get_expr()".into(),
584 )
585 .into())
586 }
587 })),
588 ("pg_my_temp_schema", guard_by_len(|_binder, []| {
589 Ok(ExprImpl::literal_int(
591 0,
593 ))
594 })),
595 ("current_setting", guard_by_len(|binder, [input]| {
596 let input = if let ExprImpl::Literal(literal) = &input &&
597 let Some(ScalarImpl::Utf8(input)) = literal.get_data()
598 {
599 input
600 } else {
601 return Err(ErrorCode::ExprError(
602 "Only literal is supported in `setting_name`.".into(),
603 )
604 .into());
605 };
606 let session_config = binder.session_config.read();
607 Ok(ExprImpl::literal_varchar(session_config.get(input.as_ref())?))
608 })),
609 ("set_config", guard_by_len(|binder, [arg0, arg1, arg2]| {
610 let setting_name = if let ExprImpl::Literal(literal) = &arg0 && let Some(ScalarImpl::Utf8(input)) = literal.get_data() {
611 input
612 } else {
613 return Err(ErrorCode::ExprError(
614 "Only string literal is supported in `setting_name`.".into(),
615 )
616 .into());
617 };
618
619 let new_value = if let ExprImpl::Literal(literal) = &arg1 && let Some(ScalarImpl::Utf8(input)) = literal.get_data() {
620 input
621 } else {
622 return Err(ErrorCode::ExprError(
623 "Only string literal is supported in `setting_name`.".into(),
624 )
625 .into());
626 };
627
628 let is_local = if let ExprImpl::Literal(literal) = &arg2 && let Some(ScalarImpl::Bool(input)) = literal.get_data() {
629 input
630 } else {
631 return Err(ErrorCode::ExprError(
632 "Only bool literal is supported in `is_local`.".into(),
633 )
634 .into());
635 };
636
637 if *is_local {
638 return Err(ErrorCode::ExprError(
639 "`is_local = true` is not supported now.".into(),
640 )
641 .into());
642 }
643
644 let mut session_config = binder.session_config.write();
645
646 session_config.set(setting_name, new_value.to_string(), &mut ())?;
648
649 Ok(ExprImpl::literal_varchar(new_value.to_string()))
650 })),
651 ("format_type", raw_call(ExprType::FormatType)),
652 ("pg_table_is_visible", raw_call(ExprType::PgTableIsVisible)),
653 ("pg_type_is_visible", raw_literal(ExprImpl::literal_bool(true))),
654 ("pg_get_constraintdef", raw_literal(ExprImpl::literal_null(DataType::Varchar))),
655 ("pg_get_partkeydef", raw_literal(ExprImpl::literal_null(DataType::Varchar))),
656 ("pg_encoding_to_char", raw_literal(ExprImpl::literal_varchar("UTF8".into()))),
657 ("has_database_privilege", raw(|binder, mut inputs| {
658 if inputs.len() == 2 {
659 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
660 }
661 if inputs.len() == 3 {
662 Ok(FunctionCall::new(ExprType::HasDatabasePrivilege, inputs)?.into())
663 } else {
664 Err(ErrorCode::ExprError(
665 "Too many/few arguments for pg_catalog.has_database_privilege()".into(),
666 )
667 .into())
668 }
669 })),
670 ("has_table_privilege", raw(|binder, mut inputs| {
671 if inputs.len() == 2 {
672 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
673 }
674 if inputs.len() == 3 {
675 if inputs[1].return_type() == DataType::Varchar {
676 inputs[1].cast_to_regclass_mut()?;
677 }
678 Ok(FunctionCall::new(ExprType::HasTablePrivilege, inputs)?.into())
679 } else {
680 Err(ErrorCode::ExprError(
681 "Too many/few arguments for pg_catalog.has_table_privilege()".into(),
682 )
683 .into())
684 }
685 })),
686 ("has_any_column_privilege", raw(|binder, mut inputs| {
687 if inputs.len() == 2 {
688 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
689 }
690 if inputs.len() == 3 {
691 if inputs[1].return_type() == DataType::Varchar {
692 inputs[1].cast_to_regclass_mut()?;
693 }
694 Ok(FunctionCall::new(ExprType::HasAnyColumnPrivilege, inputs)?.into())
695 } else {
696 Err(ErrorCode::ExprError(
697 "Too many/few arguments for pg_catalog.has_any_column_privilege()".into(),
698 )
699 .into())
700 }
701 })),
702 ("has_schema_privilege", raw(|binder, mut inputs| {
703 if inputs.len() == 2 {
704 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
705 }
706 if inputs.len() == 3 {
707 Ok(FunctionCall::new(ExprType::HasSchemaPrivilege, inputs)?.into())
708 } else {
709 Err(ErrorCode::ExprError(
710 "Too many/few arguments for pg_catalog.has_schema_privilege()".into(),
711 )
712 .into())
713 }
714 })),
715 ("has_function_privilege", raw(|binder, mut inputs| {
716 if inputs.len() == 2 {
717 inputs.insert(0, ExprImpl::literal_varchar(binder.auth_context.user_name.clone()));
718 }
719 if inputs.len() == 3 {
720 Ok(FunctionCall::new(ExprType::HasFunctionPrivilege, inputs)?.into())
721 } else {
722 Err(ErrorCode::ExprError(
723 "Too many/few arguments for pg_catalog.has_function_privilege()".into(),
724 )
725 .into())
726 }
727 })),
728 ("pg_stat_get_numscans", raw_literal(ExprImpl::literal_bigint(0))),
729 ("pg_backend_pid", raw(|binder, _inputs| {
730 Ok(ExprImpl::literal_int(binder.session_id.0))
732 })),
733 ("pg_cancel_backend", guard_by_len(|_binder, [_input]| {
734 Ok(ExprImpl::literal_bool(false))
736 })),
737 ("pg_terminate_backend", guard_by_len(|_binder, [_input]| {
738 Ok(ExprImpl::literal_bool(false))
741 })),
742 ("pg_tablespace_location", guard_by_len(|_binder, [_input]| {
743 Ok(ExprImpl::literal_null(DataType::Varchar))
744 })),
745 ("pg_postmaster_start_time", guard_by_len(|_binder, []| {
746 let server_start_time = risingwave_variables::get_server_start_time();
747 let datum = server_start_time.map(Timestamptz::from).map(ScalarImpl::from);
748 let literal = Literal::new(datum, DataType::Timestamptz);
749 Ok(literal.into())
750 })),
751 ("col_description", raw_call(ExprType::ColDescription)),
755 ("obj_description", raw_literal(ExprImpl::literal_varchar("".to_owned()))),
756 ("shobj_description", raw_literal(ExprImpl::literal_varchar("".to_owned()))),
757 ("pg_is_in_recovery", raw_call(ExprType::PgIsInRecovery)),
758 ("rw_recovery_status", raw_call(ExprType::RwRecoveryStatus)),
759 ("rw_cluster_id", raw_call(ExprType::RwClusterId)),
760 ("rw_epoch_to_ts", raw_call(ExprType::RwEpochToTs)),
761 ("rw_fragment_vnodes", raw_call(ExprType::RwFragmentVnodes)),
762 ("rw_actor_vnodes", raw_call(ExprType::RwActorVnodes)),
763 ("rw_vnode", raw_call(ExprType::VnodeUser)),
765 ("rw_license", raw_call(ExprType::License)),
766 ("rw_test_paid_tier", raw_call(ExprType::TestFeature)), ("rw_test_feature", raw_call(ExprType::TestFeature)), ("version", raw_literal(ExprImpl::literal_varchar(current_cluster_version()))),
770 ("now", now()),
772 ("current_timestamp", now()),
773 ("proctime", proctime()),
774 ("pg_sleep", raw_call(ExprType::PgSleep)),
775 ("pg_sleep_for", raw_call(ExprType::PgSleepFor)),
776 ("random", raw_call(ExprType::Random)),
777 ("date", guard_by_len(|_binder, [input]| {
783 input.cast_explicit(&DataType::Date).map_err(Into::into)
784 })),
785
786 ("openai_embedding", guard_by_len(|_binder, [arg0, arg1]| {
788 if let ExprImpl::Literal(config) = &arg0 && let Some(ScalarImpl::Jsonb(_config)) = config.get_data() {
790 Ok(FunctionCall::new(ExprType::OpenaiEmbedding, vec![arg0, arg1])?.into())
791 } else {
792 Err(ErrorCode::InvalidInputSyntax(
793 "`embedding_config` must be constant jsonb".to_owned(),
794 ).into())
795 }
796 })),
797 ]
798 .into_iter()
799 .collect()
800 });
801
802 static FUNCTIONS_BKTREE: LazyLock<BKTree<&str>> = LazyLock::new(|| {
803 let mut tree = BKTree::new(metrics::Levenshtein);
804
805 for k in HANDLES.keys() {
807 tree.add(*k);
808 }
809
810 tree
811 });
812
813 if variadic {
814 let func = match function_name {
815 "format" => ExprType::FormatVariadic,
816 "concat" => ExprType::ConcatVariadic,
817 "concat_ws" => ExprType::ConcatWsVariadic,
818 "jsonb_build_array" => ExprType::JsonbBuildArrayVariadic,
819 "jsonb_build_object" => ExprType::JsonbBuildObjectVariadic,
820 "jsonb_extract_path" => ExprType::JsonbExtractPathVariadic,
821 "jsonb_extract_path_text" => ExprType::JsonbExtractPathTextVariadic,
822 _ => {
823 return Err(ErrorCode::BindError(format!(
824 "VARIADIC argument is not allowed in function \"{}\"",
825 function_name
826 ))
827 .into());
828 }
829 };
830 return Ok(FunctionCall::new(func, inputs)?.into());
831 }
832
833 match HANDLES.get(function_name) {
835 Some(handle) => handle(self, inputs),
836 None => {
837 let allowed_distance = if function_name.len() > 3 { 2 } else { 1 };
838
839 let candidates = FUNCTIONS_BKTREE
840 .find(function_name, allowed_distance)
841 .map(|(_idx, c)| c)
842 .join(" or ");
843
844 Err(no_function!(
845 candidates = (!candidates.is_empty()).then_some(candidates),
846 "{}({})",
847 function_name,
848 inputs.iter().map(|e| e.return_type()).join(", ")
849 )
850 .into())
851 }
852 }
853 }
854
855 fn ensure_now_function_allowed(&self) -> Result<()> {
856 if self.is_for_stream()
857 && !matches!(
858 self.context.clause,
859 Some(Clause::Where)
860 | Some(Clause::Having)
861 | Some(Clause::JoinOn)
862 | Some(Clause::From)
863 )
864 {
865 return Err(ErrorCode::InvalidInputSyntax(format!(
866 "For streaming queries, `NOW()` function is only allowed in `WHERE`, `HAVING`, `ON` and `FROM`. Found in clause: {:?}. \
867 Please please refer to https://www.risingwave.dev/docs/current/sql-pattern-temporal-filters/ for more information",
868 self.context.clause
869 ))
870 .into());
871 }
872 if matches!(self.context.clause, Some(Clause::GeneratedColumn)) {
873 return Err(ErrorCode::InvalidInputSyntax(
874 "Cannot use `NOW()` function in generated columns. Do you want `PROCTIME()`?"
875 .to_owned(),
876 )
877 .into());
878 }
879 Ok(())
880 }
881
882 fn ensure_proctime_function_allowed(&self) -> Result<()> {
883 if !self.is_for_ddl() {
884 return Err(ErrorCode::InvalidInputSyntax(
885 "Function `PROCTIME()` is only allowed in CREATE TABLE/SOURCE. Is `NOW()` what you want?".to_owned(),
886 )
887 .into());
888 }
889 Ok(())
890 }
891}
892
893fn rewrite_concat_to_concat_ws(inputs: Vec<ExprImpl>) -> Result<Vec<ExprImpl>> {
894 if inputs.is_empty() {
895 Err(ErrorCode::BindError(
896 "Function `concat` takes at least 1 arguments (0 given)".to_owned(),
897 )
898 .into())
899 } else {
900 let inputs = std::iter::once(ExprImpl::literal_varchar("".to_owned()))
901 .chain(inputs)
902 .collect();
903 Ok(inputs)
904 }
905}
906
907fn rewrite_nullif_to_case_when(inputs: Vec<ExprImpl>) -> Result<Vec<ExprImpl>> {
910 if inputs.len() != 2 {
911 Err(ErrorCode::BindError("Function `nullif` must contain 2 arguments".to_owned()).into())
912 } else {
913 let inputs = vec![
914 FunctionCall::new(ExprType::Equal, inputs.clone())?.into(),
915 Literal::new(None, inputs[0].return_type()).into(),
916 inputs[0].clone(),
917 ];
918 Ok(inputs)
919 }
920}
921
922fn rewrite_two_bool_inputs(mut inputs: Vec<ExprImpl>) -> Result<Vec<ExprImpl>> {
923 if inputs.len() != 2 {
924 return Err(
925 ErrorCode::BindError("function must contain only 2 arguments".to_owned()).into(),
926 );
927 }
928 let left = inputs.pop().unwrap();
929 let right = inputs.pop().unwrap();
930 Ok(vec![
931 left.cast_implicit(&DataType::Boolean)?,
932 right.cast_implicit(&DataType::Boolean)?,
933 ])
934}