Machine-Learning/ml_api_endpoints_fix.py at master · YOIMIYA66/Machine-Learning · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
# ml_api_endpoints_fix.py
# 这个文件包含修复后的API端点函数，用于解决compare_models和ensemble API的400错误

from typing import List, Optional

# 导入原始ml_api_endpoints.py中的所有函数
from ml_api_endpoints_logs import get_deployment_logs, get_deployment_metrics
from ml_api_endpoints import (
    save_model_version,
    get_model_versions,
    deploy_model,
    get_deployed_models,
    undeploy_model
)

# 修复后的compare_models_api函数
def compare_models_api(model_names, test_data_path, target_column):
    """
    比较多个模型的性能

    Args:
        model_names: 要比较的模型名称列表
        test_data_path: 测试数据路径
        target_column: 目标列名

    Returns:
        包含比较结果的字典
    """
    import os
    import logging
    from ml_models import list_available_models, compare_models

    logger = logging.getLogger('ml_api_endpoints')

    try:
        # 验证参数
        if not model_names or len(model_names) < 2:
            return {
                "success": False,
                "error": "至少需要两个模型进行比较"
            }

        if not os.path.exists(test_data_path):
            return {
                "success": False,
                "error": f"测试数据文件不存在: {test_data_path}"
            }

        # 检查所有模型是否存在
        models = list_available_models()
        model_names_available = [m['name'] for m in models]
        missing_models = [m for m in model_names if m not in model_names_available]

        if missing_models:
            return {
                "success": False,
                "error": f"以下模型不存在: {', '.join(missing_models)}"
            }

        # 比较模型
        comparison_result = compare_models(model_names, test_data_path, target_column)

        # 格式化返回结果
        return {
            "success": True,
            "models": model_names,
            "test_data": test_data_path,
            "target_column": target_column,
            "comparison_result": comparison_result,
            "best_model": comparison_result.get('best_model', {}),
            "metrics": comparison_result.get('metrics', {}),
            "visualization_data": comparison_result.get('visualization_data', {})
        }
    except Exception as e:
        logger.error(f"比较模型时出错: {str(e)}")
        return {
            "success": False,
            "error": f"比较模型时出错: {str(e)}"
        }

# 修复后的build_ensemble_model函数
def build_ensemble_model(base_models: List[str], ensemble_type: str, weights: Optional[List[float]] = None, save_name: Optional[str] = None):
    """
    构建集成模型

    Args:
        base_models (List[str]): 基础模型名称列表
        ensemble_type (str): 集成类型 ('voting', 'stacking', 'bagging')
        weights (Optional[List[float]]): 基础模型权重列表，仅用于 'voting' 集成类型。
                                         如果提供，长度必须与 base_models 相同。
        save_name (Optional[str]): 保存的模型名称

    Returns:
        Dict[str, Any]: 包含集成模型信息的字典
    """
    import datetime
    import logging
    from ml_models import list_available_models, create_ensemble_model

    logger = logging.getLogger('ml_api_endpoints')

    try:
        # 验证参数
        if not base_models or len(base_models) < 2:
            return {
                "success": False,
                "error": "至少需要两个基础模型来构建集成模型"
            }

        if ensemble_type not in ['voting', 'stacking', 'bagging']:
            return {
                "success": False,
                "error": f"不支持的集成类型: {ensemble_type}，支持的类型有: voting, stacking, bagging"
            }

        # 验证权重（如果提供）
        if weights is not None:
            if ensemble_type != 'voting':
                return {
                    "success": False,
                    "error": "权重参数仅在 'voting' 集成类型中受支持"
                }
            if len(weights) != len(base_models):
                return {
                    "success": False,
                    "error": "权重列表的长度必须与基础模型列表的长度相同"
                }
            if not all(isinstance(w, (int, float)) for w in weights):
                return {
                    "success": False,
                    "error": "权重列表必须只包含数值"
                }

        # 检查所有基础模型是否存在
        models = list_available_models()
        model_names = [m['name'] for m in models]
        missing_models = [m for m in base_models if m not in model_names]

        if missing_models:
            return {
                "success": False,
                "error": f"以下模型不存在: {', '.join(missing_models)}"
            }

        # 准备模型列表和权重
        if weights is not None and ensemble_type == 'voting':
            model_list_with_weights = list(zip(base_models, weights))
        else:
            # 对于非voting类型或未提供权重的情况，默认权重（或由create_ensemble_model内部处理）
            model_list_with_weights = [(m, 1.0) for m in base_models] # 默认权重为1.0，create_ensemble_model可能会覆盖

        # 构建集成模型
        result = create_ensemble_model(
            model_list=model_list_with_weights,
            ensemble_type=ensemble_type,
            save_name=save_name
        )

        # 格式化返回结果
        return {
            "success": True,
            "model_name": result['model_name'],
            "ensemble_type": ensemble_type,
            "base_models": base_models,
            "model_info": {
                "type": "ensemble",
                "ensemble_type": ensemble_type,
                "base_models": base_models,
                "weights": weights if ensemble_type == 'voting' else None, # 记录权重信息
                "created_at": datetime.datetime.now().isoformat(),
                "description": result.get('metadata', {}).get('description', f"{ensemble_type.capitalize()} 集成模型")
            }
        }
    except Exception as e:
        logger.error(f"构建集成模型时出错: {str(e)}")
        return {
            "success": False,
            "error": f"构建集成模型时出错: {str(e)}"
        }