diff --git a/src/generator/testcase.py b/src/generator/testcase.py
index 9889bd7..2905183 100755
--- a/src/generator/testcase.py
+++ b/src/generator/testcase.py
@@ -3,6 +3,7 @@
number and different vary parameter combinations
"""
import os
+import pipes
from xml_parser import *
from file_path import *
@@ -78,8 +79,10 @@ def __writeTestItemsSql(self, itemName, algorithm, method, \
"'" + self.caseName + "' ," +\
"'" + self.algorithm + "' ," +\
"'" + method + "' ," +\
- "'" + paras + "' ," +\
- "'" + varVal + "' ," +\
+ "$_parasString$" \
+ + paras + "$_parasString$ ," +\
+ "$_valueString$" \
+ + varVal + "$_valueString$ ," +\
"'" + varName + "' ," +\
"'" + dataset + "' ," +\
str(rownum) + ");"
@@ -155,10 +158,10 @@ def GenCase(self, mtdList, exeIteration, tsType, debug):
elif "rows" == varName :
caseItemRows = varValue
caseItemPara.append("--" + varName + " " + \
- self.paraHandler.handle(varName, varValue, "var", mtdName))
+ pipes.quote(self.paraHandler.handle(varName, varValue, "var", mtdName)))
else:
caseItemPara.append("--" + varName + " " + \
- self.paraHandler.handle(varName, varValue, "var", mtdName))
+ pipes.quote(self.paraHandler.handle(varName, varValue, "var", mtdName)))
except Exception, exp:
pass
diff --git a/testspec/casespec/kmeans_new.xml b/testspec/casespec/kmeans_new.xml
new file mode 100755
index 0000000..21247a3
--- /dev/null
+++ b/testspec/casespec/kmeans_new.xml
@@ -0,0 +1,2646 @@
+
+
+ feature
+
+
+ kmeans
+
+
+ kmeans_new_cset
+
+ benchmark
+ TemplateExecutor
+
+
+
+ kmeans_new_plusplus
+
+ benchmark
+ TemplateExecutor
+
+
+
+ kmeans_new_random
+
+ benchmark
+ TemplateExecutor
+
+
+
+ kmeans_new_cset_ctas
+
+ benchmark
+ TemplateExecutor
+
+
+
+ kmeans_new_plusplus_ctas
+
+ benchmark
+ TemplateExecutor
+
+
+
+ kmeans_new_random_ctas
+
+ benchmark
+ TemplateExecutor
+
+
+
+
+
+ kmeans_new_cset_baseline
+ It is to get baseline of kmeans using predefined centroids against R.
+
+ 1
+
+ kmeans_new_cset
+
+ dataset
+ km_abalonekm_movement_libraskm_us_census_1990km_water_treatmentkm_winekm_winequality_red
+
+
+ dist_metric
+ madlib.dist_norm1madlib.squared_dist_norm2madlib.squared_anglemadlib.squared_tanimoto
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_baseline_result;
+
+
+
+
+ kmeans_new_plusplus_baseline
+ It is to get baseline of kmeans using plus plus against R.
+
+ 1
+
+ kmeans_new_plusplus
+
+ dataset
+ km_abalonekm_movement_libraskm_us_census_1990km_water_treatmentkm_winekm_winequality_red
+
+
+ dist_metric
+ dist_norm1squared_dist_norm2squared_anglesquared_tanimoto
+
+
+
+ k
+ 6
+
+
+
+
+
+
+ kmeans_new_random_baseline
+ It is to get baseline of kmeans using random against R.
+
+ 1
+
+ kmeans_new_random
+
+ dataset
+ km_abalonekm_movement_libraskm_us_census_1990km_water_treatmentkm_winekm_winequality_red
+
+
+ dist_metric
+ dist_norm1squared_dist_norm2squared_anglesquared_tanimoto
+
+
+
+ k
+ 6
+
+
+
+
+
+
+ kmeans_new_cset_maximum_iteration
+ It is to test kmeans with maximum iteration.
+
+ 1
+
+ kmeans_new_cset
+
+ dataset
+ km_abalonekm_movement_libraskm_us_census_1990km_water_treatmentkm_winekm_winequality_red
+
+
+ max_iter
+ 5102030
+
+
+ dist_metric
+ dist_norm1squared_dist_norm2squared_anglesquared_tanimoto
+
+
+
+
+
+ kmeans_new_plusplus_maximum_iteration
+ It is to test kmeans with maximum iteration.
+
+ 1
+
+ kmeans_new_plusplus
+
+ dataset
+ km_abalonekm_movement_libraskm_us_census_1990km_water_treatmentkm_winekm_winequality_red
+
+
+ max_iter
+ 5102030
+
+
+
+ k
+ 6
+
+
+
+
+
+
+ kmeans_new_random_maximum_iteration
+ It is to test kmeans with maximum iteration.
+
+ 1
+
+ kmeans_new_random
+
+ dataset
+ km_abalonekm_movement_libraskm_us_census_1990km_water_treatmentkm_winekm_winequality_red
+
+
+ max_iter
+ 5102030
+
+
+
+ k
+ 6
+
+
+
+
+
+
+ kmeans_cset_negative_overwrite
+ It is to test kmeans with existing output tables.
+
+ 1
+
+ kmeans_cset
+
+
+ dataset
+ km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_cset_negative_overwrite_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_cset_negative_overwrite_out_centroids
+
+
+
+
+
+ kmeans_cset
+
+
+ dataset
+ km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_cset_negative_overwrite_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_cset_negative_overwrite_out_centroids
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_overwrite_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_overwrite_out_centroids;
+
+
+
+
+
+ kmeans_plusplus_negative_overwrite
+ It is to test kmeans with existing output tables.
+
+ 1
+
+ kmeans_plusplus
+
+
+ dataset
+ km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_plusplus_negative_overwrite_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_plusplus_negative_overwrite_out_centroids
+
+
+ k
+ 6
+
+
+ sample_frac
+ 0.01
+
+
+
+
+
+ kmeans_plusplus
+
+
+ dataset
+ km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_plusplus_negative_overwrite_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_plusplus_negative_overwrite_out_centroids
+
+
+ k
+ 6
+
+
+ sample_frac
+ 0.01
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_overwrite_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_overwrite_out_centroids;
+
+
+
+
+
+ kmeans_random_negative_overwrite
+ It is to test kmeans with existing output tables.
+
+ 1
+
+ kmeans_random
+
+
+ dataset
+ km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_random_negative_overwrite_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_random_negative_overwrite_out_centroids
+
+
+ k
+ 6
+
+
+
+
+
+ kmeans_random
+
+
+ dataset
+ km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_random_negative_overwrite_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_random_negative_overwrite_out_centroids
+
+
+ k
+ 6
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_overwrite_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_overwrite_out_centroids;
+
+
+
+
+
+ kmeans_canopy_negative_overwrite
+ It is to test kmeans with existing output tables.
+
+ 1
+
+ kmeans_canopy
+
+
+ dataset
+ km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_negative_overwrite_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_canopy_negative_overwrite_out_centroids
+
+
+ t1
+ NULL
+
+
+ t2
+ NULL
+
+
+
+
+
+ kmeans_canopy
+
+
+ dataset
+ km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_negative_overwrite_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_canopy_negative_overwrite_out_centroids
+
+
+ t1
+ NULL
+
+
+ t2
+ NULL
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_overwrite_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_overwrite_out_centroids;
+
+
+
+
+
+ kmeans_cset_negative_src_relation
+ It is to test kmeans using negative source relation.
+
+ 1
+
+ kmeans_cset
+
+ src_relation
+ madlibtestdata.invalid_src_relationNULL
+
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_cset_negative_src_relation_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_cset_negative_src_relation_out_centroids
+
+
+ init_cset_rel
+ madlibtestdata.km_abalone_centroids
+
+
+ init_cset_col
+ position
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_src_relation_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_src_relation_out_centroids;
+
+
+
+
+
+ kmeans_plusplus_negative_src_relation
+ It is to test kmeans using negative source relation.
+
+ 1
+
+ kmeans_plusplus
+
+ src_relation
+ madlibtestdata.invalid_src_relationNULL
+
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_plusplus_negative_src_relation_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_plusplus_negative_src_relation_out_centroids
+
+
+ k
+ 6
+
+
+ sample_frac
+ 0.01
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_src_relation_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_src_relation_out_centroids;
+
+
+
+
+
+ kmeans_random_negative_src_relation
+ It is to test kmeans using negative source relation.
+
+ 1
+
+ kmeans_random
+
+ src_relation
+ madlibtestdata.invalid_src_relationNULL
+
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_random_negative_src_relation_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_random_negative_src_relation_out_centroids
+
+
+ k
+ 6
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_src_relation_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_src_relation_out_centroids;
+
+
+
+
+
+ kmeans_canopy_negative_src_relation
+ It is to test kmeans using negative source relation.
+
+ 1
+
+ kmeans_canopy
+
+ src_relation
+ madlibtestdata.invalid_src_relationNULL
+
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_negative_src_relation_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_canopy_negative_src_relation_out_centroids
+
+
+ t1
+ NULL
+
+
+ t2
+ NULL
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_src_relation_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_src_relation_out_centroids;
+
+
+
+
+
+ kmeans_cset_negative_src_col_data
+ It is to test kmeans using negative source column data.
+
+ 1
+
+ kmeans_cset
+
+ src_col_data
+ invalid_src_col_dataNULL
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_cset_negative_src_col_data_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_cset_negative_src_col_data_out_centroids
+
+
+
+ init_cset_rel
+ madlibtestdata.km_abalone_centroids
+
+
+ init_cset_col
+ position
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_src_col_data_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_src_col_data_out_centroids;
+
+
+
+
+
+ kmeans_plusplus_negative_src_col_data
+ It is to test kmeans using negative source column data.
+
+ 1
+
+ kmeans_plusplus
+
+ src_col_data
+ invalid_src_col_dataNULL
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_plusplus_negative_src_col_data_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_plusplus_negative_src_col_data_out_centroids
+
+
+ k
+ 6
+
+
+ sample_frac
+ 0.01
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_src_col_data_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_src_col_data_out_centroids;
+
+
+
+
+
+ kmeans_random_negative_src_col_data
+ It is to test kmeans using negative source column data.
+
+ 1
+
+ kmeans_random
+
+ src_col_data
+ invalid_src_col_dataNULL
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_random_negative_src_col_data_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_random_negative_src_col_data_out_centroids
+
+
+ k
+ 6
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_src_col_data_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_src_col_data_out_centroids;
+
+
+
+
+
+ kmeans_canopy_negative_src_col_data
+ It is to test kmeans using negative source column data.
+
+ 1
+
+ kmeans_canopy
+
+ src_col_data
+ invalid_src_col_dataNULL
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_negative_src_col_data_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_canopy_negative_src_col_data_out_centroids
+
+
+ t1
+ NULL
+
+
+ t2
+ NULL
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_src_col_data_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_src_col_data_out_centroids;
+
+
+
+
+
+ kmeans_cset_negative_src_col_id
+ It is to test kmeans using negative source column id.
+
+ 1
+
+ kmeans_cset
+
+ src_col_id
+ invalid_src_col_idNULL
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ out_points
+ madlibtestresult.kmeans_cset_negative_src_col_id_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_cset_negative_src_col_id_out_centroids
+
+
+ init_cset_rel
+ madlibtestdata.km_abalone_centroids
+
+
+ init_cset_col
+ position
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_src_col_id_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_src_col_id_out_centroids;
+
+
+
+
+
+ kmeans_plusplus_negative_src_col_id
+ It is to test kmeans using negative source column id.
+
+ 1
+
+ kmeans_plusplus
+
+ src_col_id
+ invalid_src_col_idNULL
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ out_points
+ madlibtestresult.kmeans_plusplus_negative_src_col_id_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_plusplus_negative_src_col_id_out_centroids
+
+
+ k
+ 6
+
+
+ sample_frac
+ 0.01
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_src_col_id_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_src_col_id_out_centroids;
+
+
+
+
+
+ kmeans_random_negative_src_col_id
+ It is to test kmeans using negative source column id.
+
+ 1
+
+ kmeans_random
+
+ src_col_id
+ invalid_src_col_idNULL
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ out_points
+ madlibtestresult.kmeans_random_negative_src_col_id_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_random_negative_src_col_id_out_centroids
+
+
+ k
+ 6
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_src_col_id_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_src_col_id_out_centroids;
+
+
+
+
+
+ kmeans_canopy_negative_src_col_id
+ It is to test kmeans using negative source column id.
+
+ 1
+
+ kmeans_canopy
+
+ src_col_id
+ invalid_src_col_idNULL
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_negative_src_col_id_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_canopy_negative_src_col_id_out_centroids
+
+
+ t1
+ NULL
+
+
+ t2
+ NULL
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_src_col_id_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_src_col_id_out_centroids;
+
+
+
+
+
+ kmeans_cset_negative_dist_metric
+ It is to test kmeans using negative dist metric.
+
+ 1
+
+ kmeans_cset
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_cset_negative_dist_metric_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_cset_negative_dist_metric_out_centroids
+
+
+ dist_metric
+ invalid_dist_metric
+
+
+ init_cset_rel
+ madlibtestdata.km_abalone_centroids
+
+
+ init_cset_col
+ position
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_dist_metric_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_dist_metric_out_centroids;
+
+
+
+
+
+ kmeans_plusplus_negative_dist_metric
+ It is to test kmeans using negative dist metric.
+
+ 1
+
+ kmeans_plusplus
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_plusplus_negative_dist_metric_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_plusplus_negative_dist_metric_out_centroids
+
+
+ dist_metric
+ invalid_dist_metric
+
+
+ k
+ 6
+
+
+ sample_frac
+ 0.01
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_dist_metric_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_dist_metric_out_centroids;
+
+
+
+
+
+ kmeans_random_negative_dist_metric
+ It is to test kmeans using negative dist metric.
+
+ 1
+
+ kmeans_random
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ dist_metric
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_random_negative_dist_metric_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_random_negative_dist_metric_out_centroids
+
+
+ dist_metric
+ invalid_dist_metric
+
+
+ k
+ 6
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_dist_metric_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_dist_metric_out_centroids;
+
+
+
+
+
+ kmeans_canopy_negative_dist_metric
+ It is to test kmeans using negative dist metric.
+
+ 1
+
+ kmeans_canopy
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_negative_dist_metric_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_canopy_negative_dist_metric_out_centroids
+
+
+ dist_metric
+ invalid_dist_metric
+
+
+ t1
+ NULL
+
+
+ t2
+ NULL
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_dist_metric_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_dist_metric_out_centroids;
+
+
+
+
+
+ kmeans_plusplus_negative_k
+ It is to test kmeans using negative k.
+
+ 1
+
+ kmeans_plusplus
+
+ k
+ -10
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_plusplus_negative_k_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_plusplus_negative_k_out_centroids
+
+
+ sample_frac
+ 0.01
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_k_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_k_out_centroids;
+
+
+
+
+
+ kmeans_random_negative_k
+ It is to test kmeans using negative k.
+
+ 1
+
+ kmeans_random
+
+ k
+ -10
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ k
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_random_negative_k_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_random_negative_k_out_centroids
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_k_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_k_out_centroids;
+
+
+
+
+
+ kmeans_cset_negative_max_iteration
+ It is to test kmeans using negative max iteration.
+
+ 1
+
+ kmeans_cset
+
+ max_iter
+ -10
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_cset_negative_max_iteration_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_cset_negative_max_iteration_out_centroids
+
+
+ init_cset_rel
+ madlibtestdata.km_abalone_centroids
+
+
+ init_cset_col
+ position
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_max_iteration_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_max_iteration_out_centroids;
+
+
+
+
+
+ kmeans_plusplus_negative_max_iteration
+ It is to test kmeans using negative max iteration.
+
+ 1
+
+ kmeans_plusplus
+
+ max_iter
+ -10
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_plusplus_negative_max_iteration_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_plusplus_negative_max_iteration_out_centroids
+
+
+ k
+ 6
+
+
+ sample_frac
+ 0.01
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_max_iteration_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_max_iteration_out_centroids;
+
+
+
+
+
+ kmeans_random_negative_max_iteration
+ It is to test kmeans using negative max iteration.
+
+ 1
+
+ kmeans_random
+
+ max_iter
+ -10
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_random_negative_max_iteration_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_random_negative_max_iteration_out_centroids
+
+
+ k
+ 6
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_max_iteration_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_max_iteration_out_centroids;
+
+
+
+
+
+ kmeans_canopy_negative_max_iteration
+ It is to test kmeans using negative max iteration.
+
+ 1
+
+ kmeans_canopy
+
+ max_iter
+ -10
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_negative_max_iteration_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_canopy_negative_max_iteration_out_centroids
+
+
+ t1
+ NULL
+
+
+ t2
+ NULL
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_max_iteration_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_max_iteration_out_centroids;
+
+
+
+
+
+ kmeans_cset_negative_convergence_threshold
+ It is to test kmeans using negative convergence threshold.
+
+ 1
+
+ kmeans_cset
+
+ conv_threshold
+ -0.0001010000
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_cset_negative_convergence_threshold_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_cset_negative_convergence_threshold_out_centroids
+
+
+ init_cset_rel
+ madlibtestdata.km_abalone_centroids
+
+
+ init_cset_col
+ position
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_convergence_threshold_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_convergence_threshold_out_centroids;
+
+
+
+
+
+ kmeans_plusplus_negative_convergence_threshold
+ It is to test kmeans using negative convergence threshold.
+
+ 1
+
+ kmeans_plusplus
+
+ conv_threshold
+ -0.0001010000
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_plusplus_negative_convergence_threshold_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_plusplus_negative_convergence_threshold_out_centroids
+
+
+ k
+ 6
+
+
+ sample_frac
+ 0.01
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_convergence_threshold_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_convergence_threshold_out_centroids;
+
+
+
+
+
+ kmeans_random_negative_convergence_threshold
+ It is to test kmeans using negative convergence threshold.
+
+ 1
+
+ kmeans_random
+
+ conv_threshold
+ -0.0001010000
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_random_negative_convergence_threshold_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_random_negative_convergence_threshold_out_centroids
+
+
+ k
+ 6
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_convergence_threshold_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_convergence_threshold_out_centroids;
+
+
+
+
+
+ kmeans_canopy_negative_convergence_threshold
+ It is to test kmeans using negative convergence threshold.
+
+ 1
+
+ kmeans_canopy
+
+ conv_threshold
+ -0.0001010000
+
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_negative_convergence_threshold_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_canopy_negative_convergence_threshold_out_centroids
+
+
+ t1
+ NULL
+
+
+ t2
+ NULL
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_convergence_threshold_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_convergence_threshold_out_centroids;
+
+
+
+
+
+ kmeans_cset_negative_gof_switch
+ It is to test kmeans using negative gof switch.
+
+ 1
+
+ kmeans_cset
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_cset_negative_gof_switch_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_cset_negative_gof_switch_out_centroids
+
+
+ evaluate
+ invalid_gof_switch
+
+
+ init_cset_rel
+ madlibtestdata.km_abalone_centroids
+
+
+ init_cset_col
+ position
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_gof_switch_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_gof_switch_out_centroids;
+
+
+
+
+
+ kmeans_plusplus_negative_gof_switch
+ It is to test kmeans using negative gof switch.
+
+ 1
+
+ kmeans_plusplus
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_plusplus_negative_gof_switch_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_plusplus_negative_gof_switch_out_centroids
+
+
+ evaluate
+ invalid_gof_switch
+
+
+ k
+ 6
+
+
+ sample_frac
+ 0.01
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_gof_switch_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_gof_switch_out_centroids;
+
+
+
+
+
+ kmeans_random_negative_gof_switch
+ It is to test kmeans using negative gof switch.
+
+ 1
+
+ kmeans_random
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_random_negative_gof_switch_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_random_negative_gof_switch_out_centroids
+
+
+ evaluate
+ invalid_gof_switch
+
+
+ k
+ 6
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_gof_switch_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_gof_switch_out_centroids;
+
+
+
+
+
+ kmeans_canopy_negative_gof_switch
+ It is to test kmeans using negative gof switch.
+
+ 1
+
+ kmeans_canopy
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_negative_gof_switch_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_canopy_negative_gof_switch_out_centroids
+
+
+ evaluate
+ invalid_gof_switch
+
+
+ t1
+ NULL
+
+
+ t2
+ NULL
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_gof_switch_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_gof_switch_out_centroids;
+
+
+
+
+
+ kmeans_cset_negative_out_points
+ It is to test kmeans using negative out points.
+
+ 1
+
+ kmeans_cset
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ NULL
+
+
+ out_centroids
+ madlibtestresult.kmeans_cset_negative_out_points_out_centroids
+
+
+ init_cset_rel
+ madlibtestdata.km_abalone_centroids
+
+
+ init_cset_col
+ position
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_out_points_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_out_points_out_centroids;
+
+
+
+
+
+ kmeans_plusplus_negative_out_points
+ It is to test kmeans using negative out points.
+
+ 1
+
+ kmeans_plusplus
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ NULL
+
+
+ out_centroids
+ madlibtestresult.kmeans_plusplus_negative_out_points_out_centroids
+
+
+ k
+ 6
+
+
+ sample_frac
+ 0.01
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_out_points_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_out_points_out_centroids;
+
+
+
+
+
+ kmeans_random_negative_out_points
+ It is to test kmeans using negative out points.
+
+ 1
+
+ kmeans_random
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ NULL
+
+
+ out_centroids
+ madlibtestresult.kmeans_random_negative_out_points_out_centroids
+
+
+ k
+ 6
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_out_points_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_out_points_out_centroids;
+
+
+
+
+
+ kmeans_canopy_negative_out_points
+ It is to test kmeans using negative out points.
+
+ 1
+
+ kmeans_canopy
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ NULL
+
+
+ out_centroids
+ madlibtestresult.kmeans_canopy_negative_out_points_out_centroids
+
+
+ t1
+ NULL
+
+
+ t2
+ NULL
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_out_points_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_out_points_out_centroids;
+
+
+
+
+
+ kmeans_cset_negative_out_centroids
+ It is to test kmeans using negative out centroids.
+
+ 1
+
+ kmeans_cset
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_negative_out_centroids_out_points
+
+
+ out_centroids
+ NULL
+
+
+ init_cset_rel
+ madlibtestdata.km_abalone_centroids
+
+
+ init_cset_col
+ position
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_out_centroids_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_out_centroids_out_centroids;
+
+
+
+
+
+ kmeans_plusplus_negative_out_centroids
+ It is to test kmeans using negative out centroids.
+
+ 1
+
+ kmeans_plusplus
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_negative_out_centroids_out_points
+
+
+ out_centroids
+ NULL
+
+
+ k
+ 6
+
+
+ sample_frac
+ 0.01
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_out_centroids_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_out_centroids_out_centroids;
+
+
+
+
+
+ kmeans_random_negative_out_centroids
+ It is to test kmeans using negative out centroids.
+
+ 1
+
+ kmeans_random
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_negative_out_centroids_out_points
+
+
+ out_centroids
+ NULL
+
+
+ k
+ 6
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_out_centroids_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_out_centroids_out_centroids;
+
+
+
+
+
+ kmeans_canopy_negative_out_centroids
+ It is to test kmeans using negative out centroids.
+
+ 1
+
+ kmeans_canopy
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_negative_out_centroids_out_points
+
+
+ out_centroids
+ NULL
+
+
+ t1
+ NULL
+
+
+ t2
+ NULL
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_out_centroids_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_out_centroids_out_centroids;
+
+
+
+
+
+ kmeans_cset_negative_verbosity
+ It is to test kmeans using negative verbosity.
+
+ 1
+
+ kmeans_cset
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_cset_negative_verbosity_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_cset_negative_verbosity_out_centroids
+
+
+ verbosity
+ invalid_verbosity
+
+
+ init_cset_rel
+ madlibtestdata.km_abalone_centroids
+
+
+ init_cset_col
+ position
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_verbosity_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_verbosity_out_centroids;
+
+
+
+
+
+ kmeans_plusplus_negative_verbosity
+ It is to test kmeans using negative verbosity.
+
+ 1
+
+ kmeans_plusplus
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_plusplus_negative_verbosity_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_plusplus_negative_verbosity_out_centroids
+
+
+ verbosity
+ invalid_verbosity
+
+
+ k
+ 6
+
+
+ sample_frac
+ 0.01
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_verbosity_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_verbosity_out_centroids;
+
+
+
+
+
+ kmeans_random_negative_verbosity
+ Negative test: kmeans with an invalid verbosity value.
+
+ 1
+
+ kmeans_random
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_random_negative_verbosity_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_random_negative_verbosity_out_centroids
+
+
+ verbosity
+ invalid_verbosity
+
+
+ k
+ 6
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_verbosity_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_verbosity_out_centroids;
+
+
+
+
+
+ kmeans_canopy_negative_verbosity
+ Negative test: kmeans with an invalid verbosity value.
+
+ 1
+
+ kmeans_canopy
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_negative_verbosity_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_canopy_negative_verbosity_out_centroids
+
+
+ verbosity
+ invalid_verbosity
+
+
+ t1
+ NULL
+
+
+ t2
+ NULL
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_verbosity_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_verbosity_out_centroids;
+
+
+
+
+
+ kmeans_canopy_negative_t1
+ Negative test: kmeans canopy with an invalid (negative) t1 value.
+
+ 1
+
+ kmeans_canopy
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_negative_t1_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_canopy_negative_t1_out_centroids
+
+
+ t1
+ -1
+
+
+ t2
+ NULL
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_t1_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_t1_out_centroids;
+
+
+
+
+
+ kmeans_canopy_negative_t2
+ Negative test: kmeans canopy with an invalid (negative) t2 value.
+
+ 1
+
+ kmeans_canopy
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_negative_t2_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_canopy_negative_t2_out_centroids
+
+
+ t1
+ NULL
+
+
+ t2
+ -1
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_t2_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_t2_out_centroids;
+
+
+
+
+
+ kmeans_cset_negative_init_cset_rel
+ Negative test: kmeans with an invalid initial centroid set relation (init_cset_rel).
+
+ 1
+
+ kmeans_cset
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_cset_negative_init_cset_rel_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_cset_negative_init_cset_rel_out_centroids
+
+
+ init_cset_rel
+ invalid_init_cset_rel
+
+
+ init_cset_col
+ position
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_init_cset_rel_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_init_cset_rel_out_centroids;
+
+
+
+
+
+ kmeans_cset_negative_init_cset_col
+ Negative test: kmeans with an invalid initial centroid set column (init_cset_col).
+
+ 1
+
+ kmeans_cset
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_cset_negative_init_cset_col_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_cset_negative_init_cset_col_out_centroids
+
+
+ init_cset_rel
+ madlibtestdata.km_abalone_precentroids
+
+
+ init_cset_col
+ invalid_init_cset_col
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_init_cset_col_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_init_cset_col_out_centroids;
+
+
+
+
+
+ kmeans_new_cset_ctas
+ Tests kmeans with the result stored through CREATE TABLE AS.
+
+ 1
+
+ kmeans_new_cset_ctas
+
+
+ dataset
+ km_abalone
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_new_cset_ctas_abalone;
+
+
+
+
+
+ kmeans_plusplus_ctas
+ Tests kmeans with the result stored through CREATE TABLE AS.
+
+ 1
+
+ kmeans_plusplus_ctas
+
+
+ dataset
+ km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_plusplus_ctas_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_plusplus_ctas_out_centroids
+
+
+ k
+ 6
+
+
+ sample_frac
+ 0.01
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_ctas_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_ctas_out_centroids;
+
+
+
+
+
+ kmeans_random_ctas
+ Tests kmeans with the result stored through CREATE TABLE AS.
+
+ 1
+
+ kmeans_random_ctas
+
+
+ dataset
+ km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_random_ctas_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_random_ctas_out_centroids
+
+
+ k
+ 6
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_random_ctas_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_ctas_out_centroids;
+
+
+
+
+
+ kmeans_canopy_ctas
+ Tests kmeans with the result stored through CREATE TABLE AS.
+
+ 1
+
+ kmeans_canopy_ctas
+
+
+ dataset
+ km_abalone
+
+
+ src_col_data
+ position
+
+
+ src_col_id
+ pid
+
+
+ out_points
+ madlibtestresult.kmeans_canopy_ctas_out_points
+
+
+ out_centroids
+ madlibtestresult.kmeans_canopy_ctas_out_centroids
+
+
+ t1
+ NULL
+
+
+ t2
+ NULL
+
+
+
+ DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_ctas_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_ctas_out_centroids;
+
+
+
+
+
+
diff --git a/testspec/metadata/algorithmspec.xml b/testspec/metadata/algorithmspec.xml
index b1b3b5c..3877961 100755
--- a/testspec/metadata/algorithmspec.xml
+++ b/testspec/metadata/algorithmspec.xml
@@ -3317,7 +3317,73 @@
-
+
+ kmeans_new_cset
+ true
+
+ SELECT * FROM {madlib_schema}.kmeans
+ ( {src_relation} -- rel_source
+ , {src_col_data} -- expr_point
+ , {init_cset_rel} -- rel_initial_centroids
+ , {init_cset_col} -- expr_centroid
+ , {dist_metric} -- fn_squared_dist
+ , {agg_mean} -- agg_mean
+ , {max_iter} -- max_num_iterations
+ , {conv_threshold} -- min_frac_reassigned
+ ) AS q;
+
+
+ src_relation
+ text
+
+
+ src_col_data
+ text
+
+
+ dist_metric
+ text
+ madlib.squared_dist_norm2
+
+
+ agg_mean
+ text
+ madlib.avg
+
+
+ max_iter
+ int
+ 20
+
+
+ conv_threshold
+ float
+ 0.001
+
+
+ init_cset_rel
+ text
+
+
+ init_cset_col
+ text
+
+
+
+ objective_fn
+ double precision
+
+
+ frac_reassigned
+ double precision
+
+
+ num_iterations
+ integer
+
+
+
+
kmeans_plusplus
true
@@ -3409,7 +3475,68 @@
double precision
-
+
+
+ kmeans_new_plusplus
+ true
+
+ SELECT * FROM {madlib_schema}.kmeanspp
+ ( {src_relation} -- rel_source
+ , {src_col_data} -- expr_point
+ , {k} -- k
+ , {dist_metric} -- fn_squared_dist
+ , {agg_mean} -- agg_mean
+ , {max_iter} -- max_num_iterations
+ , {conv_threshold} -- min_frac_reassigned
+ ) AS q;
+
+
+ src_relation
+ text
+
+
+ src_col_data
+ text
+
+
+ dist_metric
+ text
+ madlib.squared_dist_norm2
+
+
+ agg_mean
+ text
+ madlib.avg
+
+
+ max_iter
+ int
+ 20
+
+
+ conv_threshold
+ double precision
+ 0.001
+
+
+ k
+ smallint
+
+
+
+ objective_fn
+ double precision
+
+
+ frac_reassigned
+ double precision
+
+
+ num_iterations
+ integer
+
+
+
kmeans_random
true
@@ -3497,6 +3624,85 @@
+
+ kmeans_new_random
+ true
+
+ SELECT * FROM {madlib_schema}.kmeans_random
+ ( {src_relation} -- rel_source
+ , {src_col_data} -- expr_point
+ , {k} -- k
+ , {dist_metric} -- fn_squared_dist
+ , {agg_mean} -- agg_mean
+ , {max_iter} -- max_num_iterations
+ , {conv_threshold} -- min_frac_reassigned
+ ) AS q;
+
+
+ src_relation
+ text
+
+
+ src_col_data
+ text
+
+
+ src_col_id
+ text
+ NULL
+
+
+ out_points
+ text
+
+
+ out_centroids
+ text
+
+
+ dist_metric
+ text
+ l2norm
+
+
+ max_iter
+ int
+ 20
+
+
+ conv_threshold
+ float
+ 0.001
+
+
+ evaluate
+ boolean
+ True
+
+
+ verbosity
+ boolean
+ True
+
+
+ k
+ int
+
+
+
+ objective_fn
+ double precision
+
+
+ frac_reassigned
+ double precision
+
+
+ num_iterations
+ integer
+
+
+
kmeans_canopy
true
@@ -3673,6 +3879,73 @@
+
+ kmeans_new_cset_ctas
+
+ SELECT {madlib_schema}.create_table_as('{table_name}', $$
+ SELECT * FROM {madlib_schema}.kmeans
+ ( {src_relation} -- rel_source
+ , {src_col_data} -- expr_point
+ , {init_cset_rel} -- rel_initial_centroids
+ , {init_cset_col} -- expr_centroid
+ , ({dist_metrics})[1]-- fn_dist
+ , {agg_mean} -- agg_mean
+ , {max_iter} -- max_num_iterations
+ , {conv_threshold} -- min_frac_reassigned
+ ) AS q
+ $$);
+ SELECT {madlib_schema}.simple_silhouette
+ ( {src_relation} -- rel_source
+ , {src_col_data} -- expr_point
+ , (SELECT centroids FROM {table_name}) -- centroids
+ , ({dist_metrics})[2] -- fn_dist
+ );
+
+
+ table_name
+ text
+ false
+
+
+ src_relation
+ text
+
+
+ src_col_data
+ text
+
+
+ dist_metrics
+ text
+ false
+ ARRAY['madlib.squared_dist_norm2','madlib.dist_norm2']
+
+
+ agg_mean
+ text
+ madlib.avg
+
+
+ max_iter
+ int
+ 20
+
+
+ conv_threshold
+ float
+ 0.001
+
+
+ init_cset_rel
+ text
+
+
+ init_cset_col
+ text
+
+
+
+
kmeans_plusplus_ctas
@@ -3755,7 +4028,80 @@
-
+
+
+ kmeans_new_plusplus_ctas
+
+ CREATE TABLE {table_name} AS
+ SELECT * FROM {madlib_schema}.kmeanspp
+ ( {src_relation} -- rel_source
+ , {src_col_data} -- expr_point
+ , {k} -- k
+ , {dist_metric} -- fn_squared_dist
+ , {agg_mean} -- agg_mean
+ , {max_iter} -- max_num_iterations
+ , {conv_threshold} -- min_frac_reassigned
+ ) AS q;
+ DROP TABLE {table_name};
+
+
+ table_name
+ text
+ false
+
+
+ src_relation
+ text
+
+
+ src_col_data
+ text
+
+
+ src_col_id
+ text
+ NULL
+
+
+ out_points
+ text
+
+
+ out_centroids
+ text
+
+
+ dist_metric
+ text
+ l2norm
+
+
+ max_iter
+ int
+ 20
+
+
+ conv_threshold
+ float
+ 0.001
+
+
+ evaluate
+ boolean
+ True
+
+
+ verbosity
+ boolean
+ True
+
+
+ k
+ int
+
+
+
+
kmeans_random_ctas
@@ -3833,6 +4179,79 @@
+
+ kmeans_new_random_ctas
+
+ CREATE TABLE {table_name} AS
+ SELECT * FROM {madlib_schema}.kmeans_random
+ ( {src_relation} -- rel_source
+ , {src_col_data} -- expr_point
+ , {k} -- k
+ , {dist_metric} -- fn_squared_dist
+ , {agg_mean} -- agg_mean
+ , {max_iter} -- max_num_iterations
+ , {conv_threshold} -- min_frac_reassigned
+ ) AS q;
+ DROP TABLE {table_name};
+
+
+ table_name
+ text
+ false
+
+
+ src_relation
+ text
+
+
+ src_col_data
+ text
+
+
+ src_col_id
+ text
+ NULL
+
+
+ out_points
+ text
+
+
+ out_centroids
+ text
+
+
+ dist_metric
+ text
+ l2norm
+
+
+ max_iter
+ int
+ 20
+
+
+ conv_threshold
+ float
+ 0.001
+
+
+ evaluate
+ boolean
+ True
+
+
+ verbosity
+ boolean
+ True
+
+
+ k
+ int
+
+
+
+
kmeans_canopy_ctas
@@ -3916,8 +4335,105 @@
+
+
+ kmeans_new_pp_seeding
+ true
+
+ SELECT {madlib_schema}.kmeanspp_seeding
+ ( {src_relation} -- rel_source
+ , {src_col_data} -- expr_point
+ , {k} -- k
+ , {dist_metric} -- fn_dist
+ , {initial_centroids} -- initial_centroids
+ );
+
+
+ src_relation
+ text
+
+
+ src_col_data
+ text
+
+
+ k
+ smallint
+
+
+ dist_metric
+ text
+ madlib.dist_norm2
+
+
+ initial_centroids
+ double precision[][]
+ NULL
+
+
+
+
+ kmeans_new_random_seeding
+ true
+
+ SELECT {madlib_schema}.kmeans_random_seeding
+ ( {src_relation} -- rel_source
+ , {src_col_data} -- expr_point
+ , {k} -- k
+ , {initial_centroids} -- initial_centroids
+ );
+
+
+ src_relation
+ text
+
+
+ src_col_data
+ text
+
+
+ k
+ smallint
+
+
+ initial_centroids
+ double precision[][]
+ NULL
+
+
+
+
+ kmeans_new_silhouette
+ true
+
+ SELECT {madlib_schema}.simple_silhouette
+ ( {src_relation} -- rel_source
+ , {src_col_data} -- expr_point
+ , (SELECT centroids FROM {src_result}) -- centroids
+ , {dist_metric} -- fn_dist
+ );
+
+
+ src_relation
+ text
+
+
+ src_col_data
+ text
+
+
+ src_result
+ text
+ false
+
+
+ dist_metric
+ text
+ madlib.dist_norm2
+
+
-
+
linear_regression
diff --git a/testspec/metadata/dataset.xml b/testspec/metadata/dataset.xml
index 5ffe05d..7df3695 100755
--- a/testspec/metadata/dataset.xml
+++ b/testspec/metadata/dataset.xml
@@ -6424,6 +6424,25 @@
position
+
+ kmeans_new_cset
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ init_cset_rel
+ madlibtestdata.km_abalone_centroids
+
+
+ init_cset_col
+ position
+
+
kmeans_plusplus
@@ -6431,6 +6450,17 @@
madlibtestdata.km_abalone
+
+ kmeans_new_plusplus
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
kmeans_random
@@ -6438,6 +6468,17 @@
madlibtestdata.km_abalone
+
+ kmeans_new_random
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
kmeans_canopy
@@ -6464,6 +6505,29 @@
position
+
+ kmeans_new_cset_ctas
+
+ table_name
+ madlibtestresult.kmeans_new_cset_ctas_abalone
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
+ init_cset_rel
+ madlibtestdata.km_abalone_centroids
+
+
+ init_cset_col
+ position
+
+
kmeans_plusplus_ctas
@@ -6475,6 +6539,21 @@
madlibtestdata.km_abalone
+
+ kmeans_new_plusplus_ctas
+
+ table_name
+ madlibtestresult.kmeans_new_plusplus_ctas_abalone
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
kmeans_random_ctas
@@ -6486,6 +6565,21 @@
madlibtestdata.km_abalone
+
+ kmeans_new_random_ctas
+
+ table_name
+ madlibtestresult.kmeans_new_random_ctas_abalone
+
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+
kmeans_canopy_ctas
@@ -6497,6 +6591,17 @@
madlibtestdata.km_abalone
+
+ kmeans_new_silhouette
+
+ src_relation
+ madlibtestdata.km_abalone
+
+
+ src_col_data
+ position
+
+