khannaekta commented on a change in pull request #571:
URL: https://github.com/apache/madlib/pull/571#discussion_r723776016
##########
File path: src/ports/postgres/modules/dbscan/test/dbscan.sql_in
##########
@@ -118,27 +118,68 @@ SELECT assert(count(DISTINCT cluster_id) = 3, 'Incorrect
cluster count') FROM db
DROP TABLE IF EXISTS dbscan_train_data3;
CREATE TABLE dbscan_train_data3 (
-id_in integer,
-data0 integer,
-data1 integer);
-copy dbscan_train_data3 (id_in, data0, data1) FROM stdin delimiter '|';
-1|1|1
-2|2|2
-3|3|3
-4|4|4
-5|4|8
-6|17|8
-7|19|8
-8|19|9
-9|19|10
-10|3|111
-11|3|112
-12|3|113
-13|8|113
+ city TEXT,
+ country TEXT,
+ lat INTEGER,
+ lon INTEGER,
+ PRIMARY KEY (city, country)
+);
+COPY dbscan_train_data3 (city, country, lon, lat) FROM stdin csv header;
+city,country,lat,lon
+Bangkok,Thailand,13,100
+Athens,Greece,37,23
+Beijing,China,39,116
+St. Petersburg,Russia,59,30
+Barcelona,Spain,23,9
+Tehran,Iran,35,51
+Bristol,England,51,-2
+São Paulo,Brazil,-23,-46
+Berlin,Germany,30,25
+New Dehli,India,28,77
+Sydney,Australia,-34,151
+Bogotá,Colombia,4,-74
+Kingston,Jamaica,17,-76
+Rome,Italy,41,12
+Bombay,India,19,72
+Cape Town,South Africa,-33,22
+Cairo,Egypt,30,31
+Guayaquil,Ecuador,-2,-79
+Jakarta,Indonesia,-6,106
+Hamburg,Germany,53,2
+Hong Kong,China,22,114
+Bordeux,France,44,0
+Nairobi,Kenya,-1,36
+Osaka,Japan,34,135
\.
+-- Test that id and point params may be passed in as expressions
DROP TABLE IF EXISTS out1, out1_summary;
-SELECT
dbscan('dbscan_train_data3','out1','id_in','ARRAY[data0,data1]',20,4,'squared_dist_norm2','brute');
+SELECT dbscan('dbscan_train_data3',
+ 'out1',
+ $$('x' || left(md5(city || ',' || country),16))::BIT(64)::BIGINT$$
+ ,'ARRAY[lat,lon]',
+ 50, 1, 'squared_dist_norm2', 'optimized'
+);
+
+SELECT assert(
+ id_column = $$('x' || left(md5(city || ',' ||
country),16))::BIT(64)::BIGINT$$,
+ 'id expression passed in does not match expression saved in summary
table: ' || id_column
+) FROM out1_summary;
+SELECT assert(
+ expr_point = $$ARRAY[lat,lon]$$,
+ 'point expression passed in does not match expression saved in summary
table: ' || expr_point
+) FROM out1_summary; -- verify point expression saved in summary
+SELECT assert(COUNT(*) = 20, 'Wrong number of rows returned') FROM out1; --
Should return 20 non-noise points
+
+-- Results in Graph WCC error - TODO: fix
Review comment:
Do we still want to validate this, or can we remove it?
--
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
To unsubscribe, e-mail: [email protected]
For queries about this service, please contact Infrastructure at:
[email protected]