Files
greptimedb/tests/cases/standalone/common/aggregate/approx_distinct.sql
dennis zhuang c6e5552f05 test: migrate aggregation tests from duckdb, part4 (#6965)
* test: migrate aggregation tests from duckdb, part4

Signed-off-by: Dennis Zhuang <killme2008@gmail.com>

* fix: tests

Signed-off-by: Dennis Zhuang <killme2008@gmail.com>

* fix: rename tests

Signed-off-by: Dennis Zhuang <killme2008@gmail.com>

* fix: comments

Signed-off-by: Dennis Zhuang <killme2008@gmail.com>

* chore: ignore zero weights test

Signed-off-by: Dennis Zhuang <killme2008@gmail.com>

* chore: remove duplicated sql

Signed-off-by: Dennis Zhuang <killme2008@gmail.com>

---------

Signed-off-by: Dennis Zhuang <killme2008@gmail.com>
2025-09-25 08:00:17 +00:00

52 lines
1.7 KiB
SQL

-- Migrated from DuckDB test: test/sql/aggregate/aggregates/test_approximate_distinct_count.test
-- Test approx_distinct function
-- Basic tests
SELECT APPROX_DISTINCT(1);
-- FIXME(dennis): This feature is not implemented: Support for 'approx_distinct' for data type Null is not implemented
-- SELECT APPROX_DISTINCT(NULL);
SELECT APPROX_DISTINCT('hello');
-- Test with range data
SELECT APPROX_DISTINCT(10), APPROX_DISTINCT('hello') FROM numbers LIMIT 100;
SELECT APPROX_DISTINCT(number) FROM numbers WHERE 1 = 0 LIMIT 100 ;
-- Test with different data types
CREATE TABLE dates_test(t DATE, ts TIMESTAMP TIME INDEX);
INSERT INTO dates_test VALUES
('2008-01-01', 1000), (NULL, 2000), ('2007-01-01', 3000),
('2008-02-01', 4000), ('2008-01-02', 5000), ('2008-01-01', 6000),
('2008-01-01', 7000), ('2008-01-01', 8000);
-- FIXME(dennis): This feature is not implemented: Support for 'approx_distinct' for data type Date32 is not implemented
-- SELECT APPROX_DISTINCT(t) FROM dates_test;
DROP TABLE dates_test;
CREATE TABLE names_test(t VARCHAR, ts TIMESTAMP TIME INDEX);
INSERT INTO names_test VALUES
('Pedro', 1000), (NULL, 2000), ('Pedro', 3000), ('Pedro', 4000),
('Mark', 5000), ('Mark', 6000), ('Mark', 7000),
('Hannes-Muehleisen', 8000), ('Hannes-Muehleisen', 9000);
SELECT APPROX_DISTINCT(t) FROM names_test;
DROP TABLE names_test;
-- Test with large dataset
CREATE TABLE large_test(a INTEGER, b INTEGER, ts TIMESTAMP TIME INDEX);
INSERT INTO large_test SELECT number, number % 10, number * 1000 FROM numbers LIMIT 2000;
SELECT APPROX_DISTINCT(a), APPROX_DISTINCT(b) FROM large_test;
-- Test with groups
SELECT b, APPROX_DISTINCT(a) FROM large_test GROUP BY b ORDER BY b;
DROP TABLE large_test;