diff --git a/src/generator/testcase.py b/src/generator/testcase.py index 9889bd7..2905183 100755 --- a/src/generator/testcase.py +++ b/src/generator/testcase.py @@ -3,6 +3,7 @@ number and different vary parameter combinations """ import os +import pipes from xml_parser import * from file_path import * @@ -78,8 +79,10 @@ def __writeTestItemsSql(self, itemName, algorithm, method, \ "'" + self.caseName + "' ," +\ "'" + self.algorithm + "' ," +\ "'" + method + "' ," +\ - "'" + paras + "' ," +\ - "'" + varVal + "' ," +\ + "$_parasString$" \ + + paras + "$_parasString$ ," +\ + "$_valueString$" \ + + varVal + "$_valueString$ ," +\ "'" + varName + "' ," +\ "'" + dataset + "' ," +\ str(rownum) + ");" @@ -155,10 +158,10 @@ def GenCase(self, mtdList, exeIteration, tsType, debug): elif "rows" == varName : caseItemRows = varValue caseItemPara.append("--" + varName + " " + \ - self.paraHandler.handle(varName, varValue, "var", mtdName)) + pipes.quote(self.paraHandler.handle(varName, varValue, "var", mtdName))) else: caseItemPara.append("--" + varName + " " + \ - self.paraHandler.handle(varName, varValue, "var", mtdName)) + pipes.quote(self.paraHandler.handle(varName, varValue, "var", mtdName))) except Exception, exp: pass diff --git a/testspec/casespec/kmeans_new.xml b/testspec/casespec/kmeans_new.xml new file mode 100755 index 0000000..21247a3 --- /dev/null +++ b/testspec/casespec/kmeans_new.xml @@ -0,0 +1,2646 @@ + + + feature + + + kmeans + + + kmeans_new_cset + + benchmark + TemplateExecutor + + + + kmeans_new_plusplus + + benchmark + TemplateExecutor + + + + kmeans_new_random + + benchmark + TemplateExecutor + + + + kmeans_new_cset_ctas + + benchmark + TemplateExecutor + + + + kmeans_new_plusplus_ctas + + benchmark + TemplateExecutor + + + + kmeans_new_random_ctas + + benchmark + TemplateExecutor + + + + + + kmeans_new_cset_baseline + It is to get baseline of kmeans using predefined centroids against R. + + 1 + + kmeans_new_cset + + dataset + km_abalonekm_movement_libraskm_us_census_1990km_water_treatmentkm_winekm_winequality_red + + + dist_metric + madlib.dist_norm1madlib.squared_dist_norm2madlib.squared_anglemadlib.squared_tanimoto + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_baseline_result; + + + + + kmeans_new_plusplus_baseline + It is to get baseline of kmeans using plus plus against R. + + 1 + + kmeans_new_plusplus + + dataset + km_abalonekm_movement_libraskm_us_census_1990km_water_treatmentkm_winekm_winequality_red + + + dist_metric + dist_norm1squared_dist_norm2squared_anglesquared_tanimoto + + + + k + 6 + + + + + + + kmeans_new_random_baseline + It is to get baseline of kmeans using random against R. + + 1 + + kmeans_new_random + + dataset + km_abalonekm_movement_libraskm_us_census_1990km_water_treatmentkm_winekm_winequality_red + + + dist_metric + dist_norm1squared_dist_norm2squared_anglesquared_tanimoto + + + + k + 6 + + + + + + + kmeans_new_cset_maximum_iteration + It is to test kmeans with maximum iteration. + + 1 + + kmeans_new_cset + + dataset + km_abalonekm_movement_libraskm_us_census_1990km_water_treatmentkm_winekm_winequality_red + + + max_iter + 5102030 + + + dist_metric + dist_norm1squared_dist_norm2squared_anglesquared_tanimoto + + + + + + kmeans_new_plusplus_maximum_iteration + It is to test kmeans with maximum iteration. + + 1 + + kmeans_new_plusplus + + dataset + km_abalonekm_movement_libraskm_us_census_1990km_water_treatmentkm_winekm_winequality_red + + + max_iter + 5102030 + + + + k + 6 + + + + + + + kmeans_new_random_maximum_iteration + It is to test kmeans with maximum iteration. + + 1 + + kmeans_new_random + + dataset + km_abalonekm_movement_libraskm_us_census_1990km_water_treatmentkm_winekm_winequality_red + + + max_iter + 5102030 + + + + k + 6 + + + + + + + kmeans_cset_negative_overwrite + It is to test kmeans with existing output tables. + + 1 + + kmeans_cset + + + dataset + km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_cset_negative_overwrite_out_points + + + out_centroids + madlibtestresult.kmeans_cset_negative_overwrite_out_centroids + + + + + + kmeans_cset + + + dataset + km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_cset_negative_overwrite_out_points + + + out_centroids + madlibtestresult.kmeans_cset_negative_overwrite_out_centroids + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_overwrite_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_overwrite_out_centroids; + + + + + + kmeans_plusplus_negative_overwrite + It is to test kmeans with existing output tables. + + 1 + + kmeans_plusplus + + + dataset + km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_plusplus_negative_overwrite_out_points + + + out_centroids + madlibtestresult.kmeans_plusplus_negative_overwrite_out_centroids + + + k + 6 + + + sample_frac + 0.01 + + + + + + kmeans_plusplus + + + dataset + km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_plusplus_negative_overwrite_out_points + + + out_centroids + madlibtestresult.kmeans_plusplus_negative_overwrite_out_centroids + + + k + 6 + + + sample_frac + 0.01 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_overwrite_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_overwrite_out_centroids; + + + + + + kmeans_random_negative_overwrite + It is to test kmeans with existing output tables. + + 1 + + kmeans_random + + + dataset + km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_random_negative_overwrite_out_points + + + out_centroids + madlibtestresult.kmeans_random_negative_overwrite_out_centroids + + + k + 6 + + + + + + kmeans_random + + + dataset + km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_random_negative_overwrite_out_points + + + out_centroids + madlibtestresult.kmeans_random_negative_overwrite_out_centroids + + + k + 6 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_overwrite_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_overwrite_out_centroids; + + + + + + kmeans_canopy_negative_overwrite + It is to test kmeans with existing output tables. + + 1 + + kmeans_canopy + + + dataset + km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_canopy_negative_overwrite_out_points + + + out_centroids + madlibtestresult.kmeans_canopy_negative_overwrite_out_centroids + + + t1 + NULL + + + t2 + NULL + + + + + + kmeans_canopy + + + dataset + km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_canopy_negative_overwrite_out_points + + + out_centroids + madlibtestresult.kmeans_canopy_negative_overwrite_out_centroids + + + t1 + NULL + + + t2 + NULL + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_overwrite_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_overwrite_out_centroids; + + + + + + kmeans_cset_negative_src_relation + It is to test kmeans using negative source relation. + + 1 + + kmeans_cset + + src_relation + madlibtestdata.invalid_src_relationNULL + + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_cset_negative_src_relation_out_points + + + out_centroids + madlibtestresult.kmeans_cset_negative_src_relation_out_centroids + + + init_cset_rel + madlibtestdata.km_abalone_centroids + + + init_cset_col + position + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_src_relation_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_src_relation_out_centroids; + + + + + + kmeans_plusplus_negative_src_relation + It is to test kmeans using negative source relation. + + 1 + + kmeans_plusplus + + src_relation + madlibtestdata.invalid_src_relationNULL + + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_plusplus_negative_src_relation_out_points + + + out_centroids + madlibtestresult.kmeans_plusplus_negative_src_relation_out_centroids + + + k + 6 + + + sample_frac + 0.01 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_src_relation_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_src_relation_out_centroids; + + + + + + kmeans_random_negative_src_relation + It is to test kmeans using negative source relation. + + 1 + + kmeans_random + + src_relation + madlibtestdata.invalid_src_relationNULL + + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_random_negative_src_relation_out_points + + + out_centroids + madlibtestresult.kmeans_random_negative_src_relation_out_centroids + + + k + 6 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_src_relation_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_src_relation_out_centroids; + + + + + + kmeans_canopy_negative_src_relation + It is to test kmeans using negative source relation. + + 1 + + kmeans_canopy + + src_relation + madlibtestdata.invalid_src_relationNULL + + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_canopy_negative_src_relation_out_points + + + out_centroids + madlibtestresult.kmeans_canopy_negative_src_relation_out_centroids + + + t1 + NULL + + + t2 + NULL + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_src_relation_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_src_relation_out_centroids; + + + + + + kmeans_cset_negative_src_col_data + It is to test kmeans using negative source column data. + + 1 + + kmeans_cset + + src_col_data + invalid_src_col_dataNULL + + + + src_relation + madlibtestdata.km_abalone + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_cset_negative_src_col_data_out_points + + + out_centroids + madlibtestresult.kmeans_cset_negative_src_col_data_out_centroids + + + + init_cset_rel + madlibtestdata.km_abalone_centroids + + + init_cset_col + position + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_src_col_data_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_src_col_data_out_centroids; + + + + + + kmeans_plusplus_negative_src_col_data + It is to test kmeans using negative source column data. + + 1 + + kmeans_plusplus + + src_col_data + invalid_src_col_dataNULL + + + + src_relation + madlibtestdata.km_abalone + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_plusplus_negative_src_col_data_out_points + + + out_centroids + madlibtestresult.kmeans_plusplus_negative_src_col_data_out_centroids + + + k + 6 + + + sample_frac + 0.01 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_src_col_data_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_src_col_data_out_centroids; + + + + + + kmeans_random_negative_src_col_data + It is to test kmeans using negative source column data. + + 1 + + kmeans_random + + src_col_data + invalid_src_col_dataNULL + + + + src_relation + madlibtestdata.km_abalone + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_random_negative_src_col_data_out_points + + + out_centroids + madlibtestresult.kmeans_random_negative_src_col_data_out_centroids + + + k + 6 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_src_col_data_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_src_col_data_out_centroids; + + + + + + kmeans_canopy_negative_src_col_data + It is to test kmeans using negative source column data. + + 1 + + kmeans_canopy + + src_col_data + invalid_src_col_dataNULL + + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_canopy_negative_src_col_data_out_points + + + out_centroids + madlibtestresult.kmeans_canopy_negative_src_col_data_out_centroids + + + t1 + NULL + + + t2 + NULL + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_src_col_data_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_src_col_data_out_centroids; + + + + + + kmeans_cset_negative_src_col_id + It is to test kmeans using negative source column id. + + 1 + + kmeans_cset + + src_col_id + invalid_src_col_idNULL + + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + out_points + madlibtestresult.kmeans_cset_negative_src_col_id_out_points + + + out_centroids + madlibtestresult.kmeans_cset_negative_src_col_id_out_centroids + + + init_cset_rel + madlibtestdata.km_abalone_centroids + + + init_cset_col + position + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_src_col_id_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_src_col_id_out_centroids; + + + + + + kmeans_plusplus_negative_src_col_id + It is to test kmeans using negative source column id. + + 1 + + kmeans_plusplus + + src_col_id + invalid_src_col_idNULL + + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + out_points + madlibtestresult.kmeans_plusplus_negative_src_col_id_out_points + + + out_centroids + madlibtestresult.kmeans_plusplus_negative_src_col_id_out_centroids + + + k + 6 + + + sample_frac + 0.01 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_src_col_id_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_src_col_id_out_centroids; + + + + + + kmeans_random_negative_src_col_id + It is to test kmeans using negative source column id. + + 1 + + kmeans_random + + src_col_id + invalid_src_col_idNULL + + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + out_points + madlibtestresult.kmeans_random_negative_src_col_id_out_points + + + out_centroids + madlibtestresult.kmeans_random_negative_src_col_id_out_centroids + + + k + 6 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_src_col_id_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_src_col_id_out_centroids; + + + + + + kmeans_canopy_negative_src_col_id + It is to test kmeans using negative source column id. + + 1 + + kmeans_canopy + + src_col_id + invalid_src_col_idNULL + + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + out_points + madlibtestresult.kmeans_canopy_negative_src_col_id_out_points + + + out_centroids + madlibtestresult.kmeans_canopy_negative_src_col_id_out_centroids + + + t1 + NULL + + + t2 + NULL + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_src_col_id_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_src_col_id_out_centroids; + + + + + + kmeans_cset_negative_dist_metric + It is to test kmeans using negative dist metric. + + 1 + + kmeans_cset + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_cset_negative_dist_metric_out_points + + + out_centroids + madlibtestresult.kmeans_cset_negative_dist_metric_out_centroids + + + dist_metric + invalid_dist_metric + + + init_cset_rel + madlibtestdata.km_abalone_centroids + + + init_cset_col + position + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_dist_metric_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_dist_metric_out_centroids; + + + + + + kmeans_plusplus_negative_dist_metric + It is to test kmeans using negative dist metric. + + 1 + + kmeans_plusplus + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_plusplus_negative_dist_metric_out_points + + + out_centroids + madlibtestresult.kmeans_plusplus_negative_dist_metric_out_centroids + + + dist_metric + invalid_dist_metric + + + k + 6 + + + sample_frac + 0.01 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_dist_metric_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_dist_metric_out_centroids; + + + + + + kmeans_random_negative_dist_metric + It is to test kmeans using negative dist metric. + + 1 + + kmeans_random + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + dist_metric + pid + + + out_points + madlibtestresult.kmeans_random_negative_dist_metric_out_points + + + out_centroids + madlibtestresult.kmeans_random_negative_dist_metric_out_centroids + + + dist_metric + invalid_dist_metric + + + k + 6 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_dist_metric_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_dist_metric_out_centroids; + + + + + + kmeans_canopy_negative_dist_metric + It is to test kmeans using negative dist metric. + + 1 + + kmeans_canopy + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_canopy_negative_dist_metric_out_points + + + out_centroids + madlibtestresult.kmeans_canopy_negative_dist_metric_out_centroids + + + dist_metric + invalid_dist_metric + + + t1 + NULL + + + t2 + NULL + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_dist_metric_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_dist_metric_out_centroids; + + + + + + kmeans_plusplus_negative_k + It is to test kmeans using negative k. + + 1 + + kmeans_plusplus + + k + -10 + + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_plusplus_negative_k_out_points + + + out_centroids + madlibtestresult.kmeans_plusplus_negative_k_out_centroids + + + sample_frac + 0.01 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_k_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_k_out_centroids; + + + + + + kmeans_random_negative_k + It is to test kmeans using negative k. + + 1 + + kmeans_random + + k + -10 + + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + k + pid + + + out_points + madlibtestresult.kmeans_random_negative_k_out_points + + + out_centroids + madlibtestresult.kmeans_random_negative_k_out_centroids + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_k_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_k_out_centroids; + + + + + + kmeans_cset_negative_max_iteration + It is to test kmeans using negative max iteration. + + 1 + + kmeans_cset + + max_iter + -10 + + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_cset_negative_max_iteration_out_points + + + out_centroids + madlibtestresult.kmeans_cset_negative_max_iteration_out_centroids + + + init_cset_rel + madlibtestdata.km_abalone_centroids + + + init_cset_col + position + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_max_iteration_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_max_iteration_out_centroids; + + + + + + kmeans_plusplus_negative_max_iteration + It is to test kmeans using negative max iteration. + + 1 + + kmeans_plusplus + + max_iter + -10 + + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_plusplus_negative_max_iteration_out_points + + + out_centroids + madlibtestresult.kmeans_plusplus_negative_max_iteration_out_centroids + + + k + 6 + + + sample_frac + 0.01 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_max_iteration_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_max_iteration_out_centroids; + + + + + + kmeans_random_negative_max_iteration + It is to test kmeans using negative max iteration. + + 1 + + kmeans_random + + max_iter + -10 + + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_random_negative_max_iteration_out_points + + + out_centroids + madlibtestresult.kmeans_random_negative_max_iteration_out_centroids + + + k + 6 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_max_iteration_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_max_iteration_out_centroids; + + + + + + kmeans_canopy_negative_max_iteration + It is to test kmeans using negative max iteration. + + 1 + + kmeans_canopy + + max_iter + -10 + + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_canopy_negative_max_iteration_out_points + + + out_centroids + madlibtestresult.kmeans_canopy_negative_max_iteration_out_centroids + + + t1 + NULL + + + t2 + NULL + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_max_iteration_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_max_iteration_out_centroids; + + + + + + kmeans_cset_negative_convergence_threshold + It is to test kmeans using negative convergence threshold. + + 1 + + kmeans_cset + + conv_threshold + -0.0001010000 + + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_cset_negative_convergence_threshold_out_points + + + out_centroids + madlibtestresult.kmeans_cset_negative_convergence_threshold_out_centroids + + + init_cset_rel + madlibtestdata.km_abalone_centroids + + + init_cset_col + position + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_convergence_threshold_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_convergence_threshold_out_centroids; + + + + + + kmeans_plusplus_negative_convergence_threshold + It is to test kmeans using negative convergence threshold. + + 1 + + kmeans_plusplus + + conv_threshold + -0.0001010000 + + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_plusplus_negative_convergence_threshold_out_points + + + out_centroids + madlibtestresult.kmeans_plusplus_negative_convergence_threshold_out_centroids + + + k + 6 + + + sample_frac + 0.01 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_convergence_threshold_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_convergence_threshold_out_centroids; + + + + + + kmeans_random_negative_convergence_threshold + It is to test kmeans using negative convergence threshold. + + 1 + + kmeans_random + + conv_threshold + -0.0001010000 + + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_random_negative_convergence_threshold_out_points + + + out_centroids + madlibtestresult.kmeans_random_negative_convergence_threshold_out_centroids + + + k + 6 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_convergence_threshold_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_convergence_threshold_out_centroids; + + + + + + kmeans_canopy_negative_convergence_threshold + It is to test kmeans using negative convergence threshold. + + 1 + + kmeans_canopy + + conv_threshold + -0.0001010000 + + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_canopy_negative_convergence_threshold_out_points + + + out_centroids + madlibtestresult.kmeans_canopy_negative_convergence_threshold_out_centroids + + + t1 + NULL + + + t2 + NULL + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_convergence_threshold_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_convergence_threshold_out_centroids; + + + + + + kmeans_cset_negative_gof_switch + It is to test kmeans using negative gof switch. + + 1 + + kmeans_cset + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_cset_negative_gof_switch_out_points + + + out_centroids + madlibtestresult.kmeans_cset_negative_gof_switch_out_centroids + + + evaluate + invalid_gof_switch + + + init_cset_rel + madlibtestdata.km_abalone_centroids + + + init_cset_col + position + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_gof_switch_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_gof_switch_out_centroids; + + + + + + kmeans_plusplus_negative_gof_switch + It is to test kmeans using negative gof switch. + + 1 + + kmeans_plusplus + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_plusplus_negative_gof_switch_out_points + + + out_centroids + madlibtestresult.kmeans_plusplus_negative_gof_switch_out_centroids + + + evaluate + invalid_gof_switch + + + k + 6 + + + sample_frac + 0.01 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_gof_switch_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_gof_switch_out_centroids; + + + + + + kmeans_random_negative_gof_switch + It is to test kmeans using negative gof switch. + + 1 + + kmeans_random + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_random_negative_gof_switch_out_points + + + out_centroids + madlibtestresult.kmeans_random_negative_gof_switch_out_centroids + + + evaluate + invalid_gof_switch + + + k + 6 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_gof_switch_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_gof_switch_out_centroids; + + + + + + kmeans_canopy_negative_gof_switch + It is to test kmeans using negative gof switch. + + 1 + + kmeans_canopy + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_canopy_negative_gof_switch_out_points + + + out_centroids + madlibtestresult.kmeans_canopy_negative_gof_switch_out_centroids + + + evaluate + invalid_gof_switch + + + t1 + NULL + + + t2 + NULL + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_gof_switch_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_gof_switch_out_centroids; + + + + + + kmeans_cset_negative_out_points + It is to test kmeans using negative out points. + + 1 + + kmeans_cset + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + NULL + + + out_centroids + madlibtestresult.kmeans_cset_negative_out_points_out_centroids + + + init_cset_rel + madlibtestdata.km_abalone_centroids + + + init_cset_col + position + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_out_points_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_out_points_out_centroids; + + + + + + kmeans_plusplus_negative_out_points + It is to test kmeans using negative out points. + + 1 + + kmeans_plusplus + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + NULL + + + out_centroids + madlibtestresult.kmeans_plusplus_negative_out_points_out_centroids + + + k + 6 + + + sample_frac + 0.01 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_out_points_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_out_points_out_centroids; + + + + + + kmeans_random_negative_out_points + It is to test kmeans using negative out points. + + 1 + + kmeans_random + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + NULL + + + out_centroids + madlibtestresult.kmeans_random_negative_out_points_out_centroids + + + k + 6 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_out_points_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_out_points_out_centroids; + + + + + + kmeans_canopy_negative_out_points + It is to test kmeans using negative out points. + + 1 + + kmeans_canopy + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + NULL + + + out_centroids + madlibtestresult.kmeans_canopy_negative_out_points_out_centroids + + + t1 + NULL + + + t2 + NULL + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_out_points_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_out_points_out_centroids; + + + + + + kmeans_cset_negative_out_centroids + It is to test kmeans using negative out centroids. + + 1 + + kmeans_cset + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_canopy_negative_out_centroids_out_points + + + out_centroids + NULL + + + init_cset_rel + madlibtestdata.km_abalone_centroids + + + init_cset_col + position + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_out_centroids_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_out_centroids_out_centroids; + + + + + + kmeans_plusplus_negative_out_centroids + It is to test kmeans using negative out centroids. + + 1 + + kmeans_plusplus + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_canopy_negative_out_centroids_out_points + + + out_centroids + NULL + + + k + 6 + + + sample_frac + 0.01 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_out_centroids_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_out_centroids_out_centroids; + + + + + + kmeans_random_negative_out_centroids + It is to test kmeans using negative out centroids. + + 1 + + kmeans_random + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_canopy_negative_out_centroids_out_points + + + out_centroids + NULL + + + k + 6 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_out_centroids_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_out_centroids_out_centroids; + + + + + + kmeans_canopy_negative_out_centroids + It is to test kmeans using negative out centroids. + + 1 + + kmeans_canopy + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_canopy_negative_out_centroids_out_points + + + out_centroids + NULL + + + t1 + NULL + + + t2 + NULL + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_out_centroids_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_out_centroids_out_centroids; + + + + + + kmeans_cset_negative_verbosity + It is to test kmeans using negative verbosity. + + 1 + + kmeans_cset + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_cset_negative_verbosity_out_points + + + out_centroids + madlibtestresult.kmeans_cset_negative_verbosity_out_centroids + + + verbosity + invalid_verbosity + + + init_cset_rel + madlibtestdata.km_abalone_centroids + + + init_cset_col + position + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_verbosity_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_verbosity_out_centroids; + + + + + + kmeans_plusplus_negative_verbosity + It is to test kmeans using negative verbosity. + + 1 + + kmeans_plusplus + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_plusplus_negative_verbosity_out_points + + + out_centroids + madlibtestresult.kmeans_plusplus_negative_verbosity_out_centroids + + + verbosity + invalid_verbosity + + + k + 6 + + + sample_frac + 0.01 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_verbosity_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_negative_verbosity_out_centroids; + + + + + + kmeans_random_negative_verbosity + It is to test kmeans using negative verbosity. + + 1 + + kmeans_random + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_random_negative_verbosity_out_points + + + out_centroids + madlibtestresult.kmeans_random_negative_verbosity_out_centroids + + + verbosity + invalid_verbosity + + + k + 6 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_verbosity_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_negative_verbosity_out_centroids; + + + + + + kmeans_canopy_negative_verbosity + It is to test kmeans using negative verbosity. + + 1 + + kmeans_canopy + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_canopy_negative_verbosity_out_points + + + out_centroids + madlibtestresult.kmeans_canopy_negative_verbosity_out_centroids + + + verbosity + invalid_verbosity + + + t1 + NULL + + + t2 + NULL + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_verbosity_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_verbosity_out_centroids; + + + + + + kmeans_canopy_negative_t1 + It is to test kmeans using negative t1. + + 1 + + kmeans_canopy + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_canopy_negative_t1_out_points + + + out_centroids + madlibtestresult.kmeans_canopy_negative_t1_out_centroids + + + t1 + -1 + + + t2 + NULL + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_t1_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_t1_out_centroids; + + + + + + kmeans_canopy_negative_t2 + It is to test kmeans using negative t2. + + 1 + + kmeans_canopy + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_canopy_negative_t2_out_points + + + out_centroids + madlibtestresult.kmeans_canopy_negative_t2_out_centroids + + + t1 + NULL + + + t2 + -1 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_t2_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_negative_t2_out_centroids; + + + + + + kmeans_cset_negative_init_cset_rel + It is to test kmeans using negative init cset relation. + + 1 + + kmeans_cset + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_cset_negative_init_cset_rel_out_points + + + out_centroids + madlibtestresult.kmeans_cset_negative_init_cset_rel_out_centroids + + + init_cset_rel + invalid_init_cset_rel + + + init_cset_col + position + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_init_cset_rel_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_init_cset_rel_out_centroids; + + + + + + kmeans_cset_negative_init_cset_col + It is to test kmeans using negative init cset column. + + 1 + + kmeans_cset + + + src_relation + madlibtestdata.km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_cset_negative_init_cset_col_out_points + + + out_centroids + madlibtestresult.kmeans_cset_negative_init_cset_col_out_centroids + + + init_cset_rel + madlibtestdata.km_abalone_precentroids + + + init_cset_col + invalid_init_cset_col + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_init_cset_col_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_cset_negative_init_cset_col_out_centroids; + + + + + + kmeans_new_cset_ctas + It is to test kmeans using create table as. + + 1 + + kmeans_new_cset_ctas + + + dataset + km_abalone + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_new_cset_ctas_abalone; + + + + + + kmeans_plusplus_ctas + It is to test kmeans using create table as. + + 1 + + kmeans_plusplus_ctas + + + dataset + km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_plusplus_ctas_out_points + + + out_centroids + madlibtestresult.kmeans_plusplus_ctas_out_centroids + + + k + 6 + + + sample_frac + 0.01 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_ctas_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_plusplus_ctas_out_centroids; + + + + + + kmeans_random_ctas + It is to test kmeans using create table as. + + 1 + + kmeans_random_ctas + + + dataset + km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_random_ctas_out_points + + + out_centroids + madlibtestresult.kmeans_random_ctas_out_centroids + + + k + 6 + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_random_ctas_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_random_ctas_out_centroids; + + + + + + kmeans_canopy_ctas + It is to test kmeans using create table as. + + 1 + + kmeans_canopy_ctas + + + dataset + km_abalone + + + src_col_data + position + + + src_col_id + pid + + + out_points + madlibtestresult.kmeans_canopy_ctas_out_points + + + out_centroids + madlibtestresult.kmeans_canopy_ctas_out_centroids + + + t1 + NULL + + + t2 + NULL + + + + DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_ctas_out_points;DROP TABLE IF EXISTS madlibtestresult.kmeans_canopy_ctas_out_centroids; + + + + + + diff --git a/testspec/metadata/algorithmspec.xml b/testspec/metadata/algorithmspec.xml index b1b3b5c..3877961 100755 --- a/testspec/metadata/algorithmspec.xml +++ b/testspec/metadata/algorithmspec.xml @@ -3317,7 +3317,73 @@ - + + kmeans_new_cset + true + + + src_relation + text + + + src_col_data + text + + + dist_metric + text + madlib.squared_dist_norm2 + + + agg_mean + text + madlib.avg + + + max_iter + int + 20 + + + conv_threshold + float + 0.001 + + + init_cset_rel + text + + + init_cset_col + text + + + + objective_fn + double precision + + + frac_reassigned + double precision + + + num_iterations + integer + + + + kmeans_plusplus true