Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 2 additions & 2 deletions docs/source/contributor-guide/spark_expressions_support.md
Original file line number Diff line number Diff line change
Expand Up @@ -379,10 +379,10 @@
- [x] expm1
- [ ] factorial
- [x] floor
- [ ] greatest
- [x] greatest
- [x] hex
- [ ] hypot
- [ ] least
- [x] least
- [x] ln
- [ ] log
- [x] log10
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -108,9 +108,11 @@ object QueryPlanSerde extends Logging with CometExprShim with CometTypeShim {
classOf[Exp] -> CometScalarFunction("exp"),
classOf[Expm1] -> CometScalarFunction("expm1"),
classOf[Floor] -> CometFloor,
classOf[Greatest] -> CometScalarFunction("greatest"),
classOf[Hex] -> CometHex,
classOf[IntegralDivide] -> CometIntegralDivide,
classOf[IsNaN] -> CometIsNaN,
classOf[Least] -> CometScalarFunction("least"),
classOf[Log] -> CometLog,
classOf[Log2] -> CometLog2,
classOf[Log10] -> CometLog10,
Expand Down
211 changes: 211 additions & 0 deletions spark/src/test/resources/sql-tests/expressions/math/greatest.sql
Original file line number Diff line number Diff line change
@@ -0,0 +1,211 @@
-- Licensed to the Apache Software Foundation (ASF) under one
-- or more contributor license agreements. See the NOTICE file
-- distributed with this work for additional information
-- regarding copyright ownership. The ASF licenses this file
-- to you under the Apache License, Version 2.0 (the
-- "License"); you may not use this file except in compliance
-- with the License. You may obtain a copy of the License at
--
-- http://www.apache.org/licenses/LICENSE-2.0
--
-- Unless required by applicable law or agreed to in writing,
-- software distributed under the License is distributed on an
-- "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-- KIND, either express or implied. See the License for the
-- specific language governing permissions and limitations
-- under the License.

statement
CREATE TABLE test_greatest(a int, b int, c int) USING parquet

statement
INSERT INTO test_greatest VALUES
(1, 2, 3),
(3, 2, 1),
(NULL, 2, 3),
(1, NULL, 3),
(1, 2, NULL),
(NULL, NULL, 3),
(NULL, NULL, NULL),
(-1, 0, 1),
(2147483647, -2147483648, 0)

-- column arguments
query
SELECT greatest(a, b, c) FROM test_greatest

-- two column arguments
query
SELECT greatest(a, b) FROM test_greatest

-- literal arguments
query
SELECT greatest(1, 2, 3), greatest(3, 2, 1), greatest(-1, 0, 1)

-- NULL literal handling
query
SELECT greatest(NULL, 2, 3), greatest(1, NULL, 3), greatest(NULL, NULL, NULL)

-- mixed column and literal
query
SELECT greatest(a, 0) FROM test_greatest

statement
CREATE TABLE test_greatest_types(f float, d double, s string, dt date) USING parquet

statement
INSERT INTO test_greatest_types VALUES
(1.5, 2.5, 'apple', DATE '2023-01-01'),
(-1.5, -2.5, 'banana', DATE '2023-06-15'),
(0.0, 0.0, 'cherry', DATE '2023-12-31'),
(NULL, NULL, NULL, NULL),
(cast('NaN' as float), 1.0, 'a', DATE '2020-01-01'),
(cast('Infinity' as float), cast('-Infinity' as double), 'z', DATE '2099-12-31')

-- floating point with NaN and Infinity
query
SELECT greatest(f, 0.0) FROM test_greatest_types

query
SELECT greatest(d, 0.0) FROM test_greatest_types

-- string type
query
SELECT greatest(s, 'b') FROM test_greatest_types

-- date type
query
SELECT greatest(dt, DATE '2023-06-01') FROM test_greatest_types

-- literal floating point edge cases
query
SELECT greatest(cast('NaN' as float), 1.0), greatest(cast('NaN' as float), cast('NaN' as float))

query
SELECT greatest(cast('Infinity' as double), 1.0), greatest(cast('-Infinity' as double), 1.0)


statement
CREATE TABLE test_greatest_long(a bigint, b bigint) USING parquet

statement
INSERT INTO test_greatest_long VALUES
(1, 2),
(-1, 1),
(9223372036854775807, -9223372036854775808),
(NULL, 100),
(NULL, NULL)

-- long/bigint type
query
SELECT greatest(a, b) FROM test_greatest_long

query
SELECT greatest(cast(1 as bigint), cast(-1 as bigint), cast(9223372036854775807 as bigint))

statement
CREATE TABLE test_greatest_decimal(a decimal(20,5), b decimal(20,5)) USING parquet

statement
INSERT INTO test_greatest_decimal VALUES
(1.00000, 2.00000),
(-99999.99999, 99999.99999),
(0.00001, -0.00001),
(NULL, 123.45000),
(NULL, NULL)

-- decimal type
query
SELECT greatest(a, b) FROM test_greatest_decimal

query
SELECT greatest(cast(1.5 as decimal(10,2)), cast(2.5 as decimal(10,2)), cast(-1.0 as decimal(10,2)))

statement
CREATE TABLE test_greatest_bool(a boolean, b boolean) USING parquet

statement
INSERT INTO test_greatest_bool VALUES
(true, false),
(false, true),
(true, true),
(false, false),
(NULL, true),
(NULL, NULL)

-- boolean type
query
SELECT greatest(a, b) FROM test_greatest_bool

query
SELECT greatest(true, false), greatest(false, false), greatest(true, true)

statement
CREATE TABLE test_greatest_ts(a timestamp, b timestamp) USING parquet

statement
INSERT INTO test_greatest_ts VALUES
(TIMESTAMP '2023-01-01 08:00:00', TIMESTAMP '2023-01-01 10:00:00'),
(TIMESTAMP '2020-06-15 12:30:00', TIMESTAMP '2020-06-15 12:29:59'),
(NULL, TIMESTAMP '2023-01-01 00:00:00'),
(NULL, NULL)

-- timestamp type
query
SELECT greatest(a, b) FROM test_greatest_ts

query
SELECT greatest(TIMESTAMP '2015-07-01 08:00:00', TIMESTAMP '2015-07-01 10:00:00')

-- many arguments (5+)
query
SELECT greatest(1, 2, 3, 4, 5, 6, 7, 8, 9, 10)

query
SELECT greatest(a, b, c, a, b) FROM test_greatest

-- array type (lexicographic ordering)
statement
CREATE TABLE test_greatest_array(a array<int>, b array<int>) USING parquet

statement
INSERT INTO test_greatest_array VALUES
(array(1, 2, 3), array(1, 2, 4)),
(array(1, 2), array(1, 2, 0)),
(array(3), array(2, 9, 9)),
(array(1, 1), array(1, 1)),
(NULL, array(1)),
(array(1), NULL),
(NULL, NULL)

query
SELECT greatest(a, b) FROM test_greatest_array

query
SELECT greatest(array(1, 2), array(1, 3), array(1, 1))

query
SELECT greatest(array('b', 'a'), array('a', 'z'))

-- struct type (field-by-field ordering)
statement
CREATE TABLE test_greatest_struct(a struct<x:int, y:string>, b struct<x:int, y:string>) USING parquet

statement
INSERT INTO test_greatest_struct VALUES
(named_struct('x', 1, 'y', 'a'), named_struct('x', 2, 'y', 'a')),
(named_struct('x', 1, 'y', 'b'), named_struct('x', 1, 'y', 'a')),
(named_struct('x', 3, 'y', 'z'), named_struct('x', 3, 'y', 'z')),
(NULL, named_struct('x', 1, 'y', 'a')),
(named_struct('x', 1, 'y', 'a'), NULL),
(NULL, NULL)

query
SELECT greatest(a, b) FROM test_greatest_struct

query
SELECT greatest(named_struct('x', 1, 'y', 'b'), named_struct('x', 1, 'y', 'a'))

-- nested complex type: array of structs
query
SELECT greatest(array(named_struct('x', 1)), array(named_struct('x', 2)))
Loading
Loading