InputTable
-- Rebuild the sample input table from scratch; the DROP clears any copy left by an earlier run.
DROP TABLE input_table_varbyte;

-- One row per observation: an integer key plus a VARBYTE value holding the observation's data.
CREATE MULTISET TABLE input_table_varbyte (
    id        INTEGER,
    array_col VARBYTE(32000)
)
PRIMARY INDEX (id);

-- Each literal below is 16 bytes. Read as two little-endian IEEE-754 doubles, the rows
-- decode to (1, 1), (2, 2), (8, 8) and (9, 9).
-- NOTE(review): the byte layout is inferred from the literals themselves; confirm it against
-- the TD_KMeans documentation before relying on it.
-- Columns are named explicitly so the inserts do not depend on the table's column order.
INSERT INTO input_table_varbyte (id, array_col) VALUES (1, '000000000000F03F000000000000F03F'XB);
INSERT INTO input_table_varbyte (id, array_col) VALUES (2, '00000000000000400000000000000040'XB);
INSERT INTO input_table_varbyte (id, array_col) VALUES (3, '00000000000020400000000000002040'XB);
INSERT INTO input_table_varbyte (id, array_col) VALUES (4, '00000000000022400000000000002240'XB);
id |
array_col |
1 |
000000000000F03F000000000000F03F |
2 |
00000000000000400000000000000040 |
3 |
00000000000020400000000000002040 |
4 |
00000000000022400000000000002240 |
InitialCentroidsTable
-- Rebuild the initial-centroids table from scratch; the DROP clears any copy left by an earlier run.
DROP TABLE initial_centroids_table_varbyte;

-- Copy input rows 2 and 4 to serve as the starting centroids.
-- The columns are listed explicitly (rather than SELECT *) so this table keeps the
-- same two-column shape even if input_table_varbyte later gains columns.
CREATE MULTISET TABLE initial_centroids_table_varbyte AS (
    SELECT
        id,
        array_col
    FROM input_table_varbyte
    WHERE id IN (2, 4)
) WITH DATA;
id |
array_col |
2 |
00000000000000400000000000000040 |
4 |
00000000000022400000000000002240 |
Example: TD_KMeans SQL Call: InitialCentroidsTable not provided
-- Run TD_KMeans on the VARBYTE column without an InitialCentroidsTable input;
-- this call passes NumClusters and Seed instead.
-- NOTE(review): EmbeddingSize(2) presumably states how many values are packed into each
-- array_col entry (the sample literals are 16 bytes each) -- confirm against the function reference.
SELECT *
FROM TD_KMeans (
    ON input_table_varbyte AS InputTable
    USING
        IdColumn ('id')
        TargetColumns ('array_col')
        NumClusters (2)
        Seed (0)
        StopThreshold (0.0395)
        MaxIterNum (3)
        EmbeddingSize (2)
) AS dt;
Output: InitialCentroidsTable not provided
td_clusterid_kmeans |
array_col |
td_size_kmeans |
td_withinss_kmeans |
id |
td_modelinfo_kmeans |
0 |
000000000000F83F000000000000F83F |
2 |
1.000000000000000E+000 |
NULL |
NULL |
1 |
00000000000021400000000000002140 |
2 |
1.000000000000000E+000 |
NULL |
NULL |
NULL |
NULL |
NULL |
NULL |
NULL |
Converged: true |
NULL |
NULL |
NULL |
NULL |
NULL |
Number of Iterations: 2 |
NULL |
NULL |
NULL |
NULL |
NULL |
Number of Clusters: 2 |
NULL |
NULL |
NULL |
NULL |
NULL |
Total_WithinSS : 2.00000000000000E+00 |
NULL |
NULL |
NULL |
NULL |
NULL |
Between_SS : 9.80000000000000E+01 |
NULL |
NULL |
NULL |
NULL |
NULL |
Method for InitialCentroids: Random |
Example: TD_KMeans SQL Call: InitialCentroidsTable is provided
-- Run TD_KMeans on the VARBYTE column with the starting centroids read from
-- initial_centroids_table_varbyte, which is passed as a DIMENSION input.
-- NumClusters and Seed are not given in this call.
-- NOTE(review): EmbeddingSize(2) presumably states how many values are packed into each
-- array_col entry (the sample literals are 16 bytes each) -- confirm against the function reference.
SELECT *
FROM TD_KMeans (
    ON input_table_varbyte AS InputTable
    ON initial_centroids_table_varbyte AS InitialCentroidsTable DIMENSION
    USING
        IdColumn ('id')
        TargetColumns ('array_col')
        StopThreshold (0.0395)
        MaxIterNum (3)
        EmbeddingSize (2)
) AS dt;
Output: InitialCentroidsTable is provided
td_clusterid_kmeans |
array_col |
td_size_kmeans |
td_withinss_kmeans |
id |
td_modelinfo_kmeans |
0 |
000000000000F83F000000000000F83F |
2 |
1.000000000000000E+000 |
NULL |
NULL |
1 |
00000000000021400000000000002140 |
2 |
1.000000000000000E+000 |
NULL |
NULL |
NULL |
NULL |
NULL |
NULL |
NULL |
Converged: true |
NULL |
NULL |
NULL |
NULL |
NULL |
Number of Iterations: 2 |
NULL |
NULL |
NULL |
NULL |
NULL |
Number of Clusters: 2 |
NULL |
NULL |
NULL |
NULL |
NULL |
Total_WithinSS : 2.00000000000000E+00 |
NULL |
NULL |
NULL |
NULL |
NULL |
Between_SS : 9.80000000000000E+01 |
NULL |
NULL |
NULL |
NULL |
NULL |
Method for InitialCentroids: Externally supplied InitialCentroidsTable |