Function Coverage

Here is a list of all scalar, aggregate, and window functions from Spark, with functions that are available in Velox highlighted.

Scalar Functions

Aggregate Functions

Window Functions

abs()

count_if

inline

nvl

sqrt()

any

cume_dist

acos()

count_min_sketch

inline_outer

nvl2

stack

approx_count_distinct

dense_rank()

acosh()

covar_pop

input_file_block_length

octet_length

std

approx_percentile

first_value

add_months()

covar_samp

input_file_block_start

or

stddev

array_agg

lag

aggregate()

crc32()

input_file_name

overlay()

stddev_pop

avg()

last_value

and

cume_dist

instr()

parse_url

stddev_samp

bit_and

lead

any

current_catalog

int

percent_rank

str_to_map()

bit_or

nth_value()

approx_count_distinct

current_database

isnan()

percentile

string

bit_xor()

ntile()

approx_percentile

current_date

isnotnull()

percentile_approx

struct

bool_and

percent_rank

array()

current_timestamp

isnull()

pi

substr

bool_or

rank()

array_contains()

current_timezone

java_method

pmod()

substring()

collect_list()

row_number()

array_distinct()

current_user

json_array_length()

posexplode

substring_index()

collect_set()

array_except()

date

json_object_keys()

posexplode_outer

sum

corr()

array_intersect()

date_add()

json_tuple

position

tan

count

array_join()

date_format()

kurtosis

positive

tanh

count_if

array_max()

date_from_unix_date()

lag

pow

timestamp

count_min_sketch

array_min()

date_part

last

power()

timestamp_micros()

covar_pop

array_position()

date_sub()

last_day()

printf

timestamp_millis()

covar_samp()

array_remove()

date_trunc()

last_value

quarter()

timestamp_seconds

every

array_repeat()

datediff()

lcase

radians

tinyint

first()

array_sort()

day()

lead

raise_error()

to_csv

first_value

array_union()

dayofmonth()

least()

rand()

to_date

grouping

arrays_overlap

dayofweek()

left()

randn

to_json

grouping_id

arrays_zip()

dayofyear()

length()

random()

to_timestamp

histogram_numeric

ascii()

decimal

levenshtein()

range

to_unix_timestamp()

kurtosis()

asin()

decode

like()

rank

to_utc_timestamp()

last()

asinh()

degrees()

ln

reflect

transform()

last_value

assert_true

dense_rank

locate()

regexp

transform_keys

max()

atan()

div

log()

regexp_extract()

transform_values

max_by()

atan2()

double

log10()

regexp_extract_all()

translate()

mean

atanh()

e

log1p()

regexp_like

trim()

min()

avg

element_at()

log2()

regexp_replace()

trunc()

min_by()

base64

elt

lower()

repeat()

try_add

percentile

between()

encode

lpad()

replace()

try_divide

percentile_approx

bigint

every

ltrim()

reverse()

typeof

regr_avgx

bin()

exists()

make_date()

right

ucase

regr_avgy

binary

exp()

make_dt_interval

rint()

unbase64()

regr_count

bit_and

explode

make_interval

rlike()

unhex()

regr_r2

bit_count()

explode_outer

make_timestamp()

round()

unix_date()

skewness()

bit_get()

expm1()

make_ym_interval()

row_number

unix_micros()

some

bit_length()

extract

map()

rpad()

unix_millis()

std

bit_or

factorial()

map_concat()

rtrim()

unix_seconds()

stddev()

bit_xor

filter()

map_entries()

schema_of_csv

unix_timestamp()

stddev_pop

bool_and

find_in_set()

map_filter()

schema_of_json

upper()

stddev_samp()

bool_or

first

map_from_arrays()

second()

uuid()

sum()

boolean

first_value

map_from_entries

sentences

var_pop

try_avg

bround

flatten()

map_keys()

sequence

var_samp

try_sum

btrim

float

map_values()

session_window

variance

var_pop

cardinality

floor()

map_zip_with()

sha

version

var_samp()

case

forall()

max

sha1()

weekday()

variance()

cast

format_number

max_by

sha2()

weekofyear

cbrt()

format_string

md5()

shiftleft()

when

ceil()

from_csv

mean

shiftright()

width_bucket()

ceiling

from_json

min

shiftrightunsigned

window

char

from_unixtime()

min_by

shuffle()

xpath

char_length

from_utc_timestamp()

minute()

sign()

xpath_boolean

character_length

get_json_object()

mod

signum

xpath_double

chr()

getbit

monotonically_increasing_id()

sin

xpath_float

coalesce

greatest()

month()

sinh()

xpath_int

collect_list

grouping

months_between

size()

xpath_long

collect_set

grouping_id

named_struct

skewness

xpath_number

concat()

hash()

nanvl

slice()

xpath_short

concat_ws

hex()

negative

smallint

xpath_string

conv()

hour()

next_day()

some

xxhash64()

corr

hypot()

not()

sort_array()

year()

cos()

if

now

soundex()

zip_with()

cosh()

ifnull

nth_value

space

cot()

in()

ntile

spark_partition_id()

count

initcap

nullif

split()