Skip to content

Commit

Permalink
Hidden Functions (#1250)
Browse files Browse the repository at this point in the history
  • Loading branch information
yliuuuu authored Oct 25, 2023
1 parent 9abc89e commit 7d9cf21
Show file tree
Hide file tree
Showing 5 changed files with 188 additions and 56 deletions.
1 change: 1 addition & 0 deletions partiql-plan/src/main/resources/partiql_plan_0_1.ion
Original file line number Diff line number Diff line change
Expand Up @@ -33,6 +33,7 @@ fn::[
},
unresolved::{
identifier: identifier,
isHidden: bool,
},
]

Expand Down
77 changes: 77 additions & 0 deletions partiql-planner/PlannerCheckList.adoc
Original file line number Diff line number Diff line change
@@ -0,0 +1,77 @@
== Planner Implementation Check List

=== Functions and Operators


|===
|Category |Name |Query Expression |Header Function signature | Hidden | Implemented | COMMENT

|Logical Operator |NOT | NOT expr | not(expr: Boolean) : Boolean | True | Yes. |
|Logical Operator | AND | expr1 AND expr2 | and(expr1: Boolean, expr2: Boolean) : Boolean | True | Yes. |
|Logical Operator | OR | expr1 or expr2 | or(expr1: Boolean, expr2 Boolean) : Boolean | True | Yes. |
| Unary Operator | POS | +expr | pos(expr: T) : T where T is a numeric Type| True | Yes. |
|Unary Operator | NEG | -expr | neg(expr:T) : T where T is a numeric Type| True | Yes. |
|Arithmetic Operator | PLUS | expr1 + expr2 | plus(expr1: T, expr2: T) : T where T is a numeric Type | True | Yes. |
|Arithmetic Operator | MINUS | expr1 - expr2 | minus(expr1: T, expr2: T) : T where T is a numeric Type | True | Yes. |
|Arithmetic Operator | Multiplication | expr1 * expr2 | times(expr1: T, expr2: T) : T where T is a numeric Type | True | Yes. |
|Arithmetic Operator | Division | expr1 / expr2 | div(expr1: T, expr2: T) : T where T is a numeric Type | True | Yes. |
|Arithmetic Operator | Modulo | expr1 % expr2 | mod(expr1: T, expr2: T) : T where T is a numeric Type | True | Yes. |
|Arithmetic Operator | Bitwise AND | expr1 & expr2 | bitwise_and(expr1: I, expr2: I) : I where I is a Integer Type| True | Yes. |
|Comparison Operator | Equal | expr1 = expr2 | eq(expr1: T, expr2: T) : Boolean where T is any PartiQL Value Type. | True | Yes. |
|Comparison Operator | NOT EQUAL | expr1 != expr2 ; expr1 <> expr2 | ne(expr1: T, expr2: T) : Boolean where T is any PartiQL Value Type. | True | Yes. |
|Comparison Operator | LESS THAN | expr1 < expr2 | lt(expr1: T, expr2: T) : Boolean where T is any PartiQL Value Type. | True | Yes. |
|Comparison Operator | LESS THAN OR EQUAL | expr1 ≤ expr2 | lte(expr1: T, expr2: T) : Boolean where T is any PartiQL Value Type. | True | Yes. |
|Comparison Operator | GREATER THAN | expr1 > expr2 | gt(expr1: T, expr2: T) : Boolean where T is any PartiQL Value Type. | True | Yes. |
|Comparison Operator | GREATER THAN OR EQUAL | expr1 ≥ expr2 | gte(expr1: T, expr2: T) : Boolean where T is any PartiQL Value Type. | True | Yes. |
| Function | Upper | UPPER(expr) | upper(expr: T) : T where T is a text Type | False | Yes. |
| Function | Lower | LOWER(expr) | lower(expr: T) : T where T is a text Type | False | Yes. |
| Function | Coalesce | COALESCE(expr, expr2, ...., expr_n) | N/A | False | No. |
| Function | Nullif | NULLIF(expr1, expr2) | N/A | False | Yes. |
| Function | UtcNow | UTCNOW() | utcnow() : Timestamp | False | Yes. |
| Function | position | POSITION(expr1, epxr2) | position(expr1: T, expr2: T) : INT64 | False | YES. |
| Function - Special Form| position | POSITION(expr1 in expr2) | position(expr1: T, expr2: T) : INT64 | TRUE | YES. |
| Function | substring | SUBSTRING(expr1, expr2) | substring(expr1: T, expr2: INT64) : T where T is a Text Type | False | Yes. |
| Function - special form | substring | SUBSTRING(expr1 FROM expr2) | substring(expr1: T, expr2: INT64) : T where T is a Text Type | True | Yes. |
| Function | substring | SUBSTRING(expr1, expr2, expr3) | substring(expr1: T, expr2: INT64, expr3: INT64) : T where T is a Text Type | False | Yes. |
| Function - special form | substring | SUBSTRING(expr1 FROM expr2 FOR expr3) | substring(expr1: T, expr2: INT64, expr3: INT64) : T where T is a Text Type | False | Yes. |
| Function | Trim | TRIM(expr) | trim(expr: T) : T where T is a Text Type | False | Yes. |
| Function - special form | Trim | TRIM(BOTH FROM expr) | N/A | TRUE | NO. |
| Function - special form | Trim | TRIM(expr1 FROM expr2); TRIM(BOTH expr1 FROM expr2) | trim_chars(expr1: T, expr2: T) : T where T is a Text Type | True | Yes. |
| Function - special form | Trim | TRIM(LEADING FROM expr) | trim_leading(expr: T) : T where T is a Text Type | True | Yes. |
| Function - special form | Trim | TRIM(LEADING expr1 FROM expr2) | trim_leading_chars(expr1: T, expr2: T) : T where T is a Text Type | True | Yes. |
| Function - special form | Trim | TRIM(TRAILING FROM expr) | trim_trailing(expr: T) : T where T is a Text Type | True | Yes. |
| Function - special form | Trim | TRIM(TRAILING expr1 FROM expr2) | trim_trailing_chars(expr1: T, expr2: T) : T where T is a Text Type | True | Yes. |
| Function - special form | LIKE | expr1 LIKE expr2 | like(expr1: STRING, expr2: STRING) : Boolean | True | Yes. |
| Function - special form | LIKE | expr1 LIKE expr2 ESCAPE expr3 | like(expr1: STRING, expr2: STRING, expr3: STRING) : Boolean | True | Yes. |
| Function - special form | BETWEEN | expr1 BETWEEN expr2 AND expr3 | between(expr1: T, expr2: T, expr3: T) : Boolean where T is a numeric Type | True | Yes. | Between can also be applied to Datetime type in many data base system.
| Function - special form | IN | expr1 IN expr2 | in_collection(expr1: T1, expr2: T2) : Boolean where T1 can be any PartiQL value Type and T2 is a collection Type | True | Yes. |
| is Operator | IS | expr IS type | is_$type_name(expr: T) where T can be any PartiQL Value Type | True | Yes. | The type operand of the is Operator get reflected by the function name
| Cast Operator | CAST | CAST(expr AS Type)| cast_$type_name(expr) | True | Yes | Cast function are generated based on the Type lattice
| Function - special form | DATE_ADD | DATE_ADD(datetimePart, expr1, expr2) | date_add_$datetimePart(expr1: INT, expr2: T) where T is a Datetime Type | True | Yes. | The datetime part operand of the date_add function get reflected by the function name
| Function - special form | DATE_DIFF | DATE_DIFF(datetimePart, expr1, expr2) | date_diff_$datetimePart(expr1: T, expr2: T) : INT64 : where T is a Datetime Type | True | Yes. | The datetime part operand of the date_diff function get reflected by the function name
| System Function | CURRENT_USER | CURRENT_USER | current_user()| True | Yes |
| System Function | CURRENT_DATE | CURRENT_DATE | current_user()| True | Yes |
| Function | CHAR_LENGTH | CHAR_LENGTH(str) | N/A | N/A | No |
| Function | EXIST | EXISTS(val) | N/A | N/A | No |
| Function | EXTRACT | EXTRACT(datatimePart FROM t) | N/A | N/A | No |
| Function | FILTER_DISTINCT | FILTER_DISTINCT(c) | N/A | N/A | No |
| Function | MAKE DATE | MAKE_DATE(year, month, day) | N/A | N/A | No | We might be able to deprecate this function once we have the constructor call for Date Literal
| Function | MAKE DATE | MAKE_TIME(hour, minute, second, timezoneMinutes?) | N/A | N/A | No | We might be able to deprecate this function once we have the constructor call for TIME Literal
| Function | SIZE | SIZE(c) | N/A | N/A | No |
| Function | TO_STRING | TO_STRING(timestamp, timestamp_format_pattern) | N/A | N/A | No |
| Function | TO_TIMESTAMP | TO_TIMESTAMP(str[ , timestamp_format_pattern]) | N/A | N/A | No |
| Function | UNIX_TIMESTAMP | UNIX_TIMESTAMP([timestamp]) | N/A | N/A | No |
| Function | FROM_UNIXTIME | FROM_UNIXTIME(unix_timestamp) | N/A | N/A | No |
| Function | CEILING | CEILING(v) | N/A | N/A | NO |
| Function | FLOOR | FLOOR(v) | N/A | N/A | NO |
| Function | ABS | ABS(v) | N/A | N/A | NO |
| Function | SQRT | SQRT(v) | N/A | N/A | NO |
| Function | Nature log | LN(v) | N/A | N/A | NO |
| Function | exponential | EXP(v) | N/A | N/A | NO |
| Function | POWER | POW(v) | N/A | N/A | NO |
| Function | BIT_LENGTH | BIT_LENGTH(v) | N/A | N/A | NO |
| Function | OCTET_LENGTH | OCTET_LENGTH(v) | N/A | N/A | NO |
| Function | OVERLAY | OVERLAY(str1 PLACING str2 FROM pos) | N/A | N/A | NO |
| Function | OVERLAY | OVERLAY(str1 PLACING str2 FROM pos FOR for) | N/A | N/A | NO |
| Function | TEXT_REPLACE | TEXT_REPLACE(string, from, to) | N/A | N/A | NO |
|===
119 changes: 82 additions & 37 deletions partiql-planner/src/main/kotlin/org/partiql/planner/Header.kt
Original file line number Diff line number Diff line change
Expand Up @@ -38,18 +38,12 @@ import org.partiql.value.PartiQLValueType.SYMBOL
import org.partiql.value.PartiQLValueType.TIME
import org.partiql.value.PartiQLValueType.TIMESTAMP

/**
* A structure for scalar function lookup.
*/
private typealias FnMap<T> = Map<String, List<T>>

/**
* Map session attributes to underlying function name.
* Unicode non-character to be used for name sanitization
*/
internal val ATTRIBUTES: Map<String, String> = mapOf(
"CURRENT_USER" to "\$__current_user",
"CURRENT_DATE" to "\$__current_date"
)
private val HIDDEN_FLAG: Char = Char(0xFDD0)

/**
* A place for type and function definitions. Eventually these will be read from Ion files.
Expand All @@ -73,7 +67,9 @@ internal class Header(
*/
public fun lookup(ref: Fn.Unresolved): List<FunctionSignature.Scalar> {
val name = getFnName(ref.identifier)
return functions.getOrDefault(name, emptyList())
return if (ref.isHidden)
functions.getOrDefault("${HIDDEN_FLAG}_$name", emptyList())
else functions.getOrDefault(name, emptyList())
}

/**
Expand All @@ -92,7 +88,7 @@ internal class Header(
return null
}
val name = castName(targetType)
val casts = functions.getOrDefault(name, emptyList())
val casts = functions.getOrDefault("${HIDDEN_FLAG}_$name", emptyList())
for (cast in casts) {
if (cast.parameters.isEmpty()) {
break // should be unreachable
Expand Down Expand Up @@ -139,15 +135,18 @@ internal class Header(
val types = TypeLattice.partiql()
val (casts, unsafeCastSet) = Functions.casts(types)
val functions = Functions.combine(
Functions.builtins()
)
val internalFunctions = Functions.combineInternal(
casts,
Functions.operators(),
Functions.builtins(),
Functions.special(),
Functions.system(),
)
val aggregations = Functions.combine(
Functions.aggregations(),
)
return Header(namespace, types, functions, aggregations, unsafeCastSet)
return Header(namespace, types, functions + internalFunctions, aggregations, unsafeCastSet)
}

/**
Expand All @@ -171,11 +170,13 @@ internal class Header(
public fun <T : FunctionSignature> combine(vararg functions: List<T>): FnMap<T> {
return functions.flatMap { it.sortedWith(functionPrecedence) }.groupBy { it.name }
}
public fun <T : FunctionSignature> combineInternal(vararg functions: List<T>): FnMap<T> {
return functions.flatMap { it.sortedWith(functionPrecedence) }.groupBy { "${HIDDEN_FLAG}_${it.name}" }
}

// ====================================
// TYPES
// ====================================

private val allTypes = PartiQLValueType.values()

private val nullableTypes = listOf(
Expand Down Expand Up @@ -271,28 +272,37 @@ internal class Header(
).flatten()

/**
* SQL and PartiQL Scalar Builtins
* SQL Builtins (not special forms)
*/
public fun builtins(): List<FunctionSignature.Scalar> = listOf(
upper(),
lower(),
coalesce(),
nullIf(),
position(),
substring(),
trim(),
utcNow(),
).flatten()

/**
* SQL and PartiQL special forms
*/
public fun special(): List<FunctionSignature.Scalar> = listOf(
like(),
between(),
inCollection(),
isType(),
isTypeSingleArg(),
isTypeDoubleArgsInt(),
isTypeTime(),
coalesce(),
nullIf(),
substring(),
position(),
trim(),
substring(),
trimSpecial(),
overlay(),
extract(),
dateAdd(),
dateDiff(),
utcNow(),
).flatten()

/**
Expand Down Expand Up @@ -521,19 +531,22 @@ internal class Header(
// TODO
private fun coalesce(): List<FunctionSignature.Scalar> = emptyList()

// NULLIF(x, y)
private fun nullIf(): List<FunctionSignature.Scalar> = nullableTypes.map { t ->
FunctionSignature.Scalar(
name = "null_if",
returns = t,
parameters = listOf(
FunctionParameter("value", t),
FunctionParameter("nullifier", BOOL),
FunctionParameter("nullifier", BOOL), // TODO: why is this BOOL?
),
isNullCall = true,
isNullable = true,
)
}

// SUBSTRING (expression, start[, length]?)
// SUBSTRINGG(expression from start [FOR length]? )
private fun substring(): List<FunctionSignature.Scalar> = textTypes.map { t ->
listOf(
FunctionSignature.Scalar(
Expand All @@ -547,7 +560,7 @@ internal class Header(
isNullable = false,
),
FunctionSignature.Scalar(
name = "substring_length",
name = "substring",
returns = t,
parameters = listOf(
FunctionParameter("value", t),
Expand All @@ -560,6 +573,8 @@ internal class Header(
)
}.flatten()

// position (str1, str2)
// position (str1 in str2)
private fun position(): List<FunctionSignature.Scalar> = textTypes.map { t ->
FunctionSignature.Scalar(
name = "position",
Expand All @@ -573,17 +588,24 @@ internal class Header(
)
}

// trim(str)
private fun trim(): List<FunctionSignature.Scalar> = textTypes.map { t ->
listOf(
FunctionSignature.Scalar(
name = "trim",
returns = t,
parameters = listOf(
FunctionParameter("value", t),
),
isNullCall = true,
isNullable = false,
FunctionSignature.Scalar(
name = "trim",
returns = t,
parameters = listOf(
FunctionParameter("value", t),
),
isNullCall = true,
isNullable = false,
)
}

// TODO: We need to add a special form function for TRIM(BOTH FROM value)
private fun trimSpecial(): List<FunctionSignature.Scalar> = textTypes.map { t ->
listOf(
// TRIM(chars FROM value)
// TRIM(both chars from value)
FunctionSignature.Scalar(
name = "trim_chars",
returns = t,
Expand All @@ -594,6 +616,7 @@ internal class Header(
isNullCall = true,
isNullable = false,
),
// TRIM(LEADING FROM value)
FunctionSignature.Scalar(
name = "trim_leading",
returns = t,
Expand All @@ -603,6 +626,7 @@ internal class Header(
isNullCall = true,
isNullable = false,
),
// TRIM(LEADING chars FROM value)
FunctionSignature.Scalar(
name = "trim_leading_chars",
returns = t,
Expand All @@ -613,6 +637,7 @@ internal class Header(
isNullCall = true,
isNullable = false,
),
// TRIM(TRAILING FROM value)
FunctionSignature.Scalar(
name = "trim_trailing",
returns = t,
Expand All @@ -622,6 +647,7 @@ internal class Header(
isNullCall = true,
isNullable = false,
),
// TRIM(TRAILING chars FROM value)
FunctionSignature.Scalar(
name = "trim_trailing_chars",
returns = t,
Expand All @@ -641,15 +667,15 @@ internal class Header(
// TODO
private fun extract(): List<FunctionSignature.Scalar> = emptyList()

private fun dateArithmetic(prefix: String): List<FunctionSignature.Scalar> {
private fun dateAdd(): List<FunctionSignature.Scalar> {
val operators = mutableListOf<FunctionSignature.Scalar>()
for (type in datetimeTypes) {
for (field in DatetimeField.values()) {
if (field == DatetimeField.TIMEZONE_HOUR || field == DatetimeField.TIMEZONE_MINUTE) {
continue
}
val signature = FunctionSignature.Scalar(
name = "${prefix}_${field.name.lowercase()}",
name = "date_add_${field.name.lowercase()}",
returns = type,
parameters = listOf(
FunctionParameter("interval", INT),
Expand All @@ -664,9 +690,28 @@ internal class Header(
return operators
}

private fun dateAdd(): List<FunctionSignature.Scalar> = dateArithmetic("date_add")

private fun dateDiff(): List<FunctionSignature.Scalar> = dateArithmetic("date_diff")
private fun dateDiff(): List<FunctionSignature.Scalar> {
val operators = mutableListOf<FunctionSignature.Scalar>()
for (type in datetimeTypes) {
for (field in DatetimeField.values()) {
if (field == DatetimeField.TIMEZONE_HOUR || field == DatetimeField.TIMEZONE_MINUTE) {
continue
}
val signature = FunctionSignature.Scalar(
name = "date_diff_${field.name.lowercase()}",
returns = INT64,
parameters = listOf(
FunctionParameter("datetime1", type),
FunctionParameter("datetime2", type),
),
isNullCall = true,
isNullable = false,
)
operators.add(signature)
}
}
return operators
}

private fun utcNow(): List<FunctionSignature.Scalar> = listOf(
FunctionSignature.Scalar(
Expand All @@ -678,14 +723,14 @@ internal class Header(
)

private fun currentUser() = FunctionSignature.Scalar(
name = "\$__current_user",
name = "current_user",
returns = STRING,
parameters = emptyList(),
isNullable = true,
)

private fun currentDate() = FunctionSignature.Scalar(
name = "\$__current_date",
name = "current_date",
returns = DATE,
parameters = emptyList(),
isNullable = false,
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -342,8 +342,8 @@ internal object RelConverter {
schema.add(binding)
val args = expr.args.map { arg -> arg.toRex(env) }
val id = AstToPlan.convert(expr.function)
val agg = aggUnresolved(id)
relOpAggregateCall(agg, args)
val fn = aggUnresolved(id)
relOpAggregateCall(fn, args)
}
var groups = emptyList<Rex>()
if (groupBy != null) {
Expand Down
Loading

0 comments on commit 7d9cf21

Please sign in to comment.