TMCMC/utils.py at main · bominwang/TMCMC · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
"""
------------------------------------------------------------------------------------------------------------------------
BearGangLab - 过渡马尔可夫链蒙特卡洛 (T-MCMC)
------------------------------------------------------------------------------------------------------------------------
先验分布和似然函数定义

参考文献:
'J. Ching and Y.-C. Chen. Transitional Markov Chain Monte Carlo Method for Bayesian
Model Updating, Model Class Selection, and Model Averaging. Journal of Engineering
Mechanics, 133(7):816-832, 2007'

作者: BoMin Wang
日期: 20240324
------------------------------------------------------------------------------------------------------------------------
"""
import numpy as np
from scipy import stats


class PriorDistribution:
    """
    先验分布类

    支持的分布类型:
    - 'normal': 正态分布
    - 'uniform': 均匀分布
    - 'lognormal': 对数正态分布
    - 'gamma': 伽马分布
    - 'beta': Beta 分布
    - 'exponential': 指数分布
    """

    def __init__(self, distribution_type: str, **params):
        """
        初始化先验分布

        参数:
        ----------
        distribution_type : str
            分布类型，可选 ['normal', 'uniform', 'lognormal', 'gamma', 'beta', 'exponential']
        **params : dict
            分布参数
            - normal: mean, std
            - uniform: low, high
            - lognormal: mean, std (对数空间的均值和标准差)
            - gamma: shape, scale
            - beta: alpha, beta
            - exponential: scale
        """
        self.distribution_type = distribution_type
        self.params = params

        # 根据分布类型创建 scipy.stats 分布对象
        if distribution_type == 'normal':
            mean = params.get('mean', 0.0)
            std = params.get('std', 1.0)
            self.dist = stats.norm(loc=mean, scale=std)

        elif distribution_type == 'uniform':
            low = params.get('low', 0.0)
            high = params.get('high', 1.0)
            self.dist = stats.uniform(loc=low, scale=high-low)

        elif distribution_type == 'lognormal':
            mean = params.get('mean', 0.0)
            std = params.get('std', 1.0)
            self.dist = stats.lognorm(s=std, scale=np.exp(mean))

        elif distribution_type == 'gamma':
            shape = params.get('shape', 2.0)
            scale = params.get('scale', 1.0)
            self.dist = stats.gamma(a=shape, scale=scale)

        elif distribution_type == 'beta':
            alpha = params.get('alpha', 2.0)
            beta = params.get('beta', 2.0)
            self.dist = stats.beta(a=alpha, b=beta)

        elif distribution_type == 'exponential':
            scale = params.get('scale', 1.0)
            self.dist = stats.expon(scale=scale)

        else:
            raise ValueError(f"不支持的分布类型: {distribution_type}")

    def sample(self, size):
        """
        从先验分布中生成随机样本

        参数:
        ----------
        size : int or tuple
            样本形状

        返回:
        ----------
        samples : np.ndarray
            随机样本
        """
        return self.dist.rvs(size=size)

    def pdf(self, x: np.ndarray) -> np.ndarray:
        """
        计算概率密度函数值

        参数:
        ----------
        x : np.ndarray
            输入点

        返回:
        ----------
        pdf_values : np.ndarray
            概率密度值
        """
        return self.dist.pdf(x)

    def log_pdf(self, x: np.ndarray) -> np.ndarray:
        """
        计算对数概率密度函数值

        参数:
        ----------
        x : np.ndarray
            输入点

        返回:
        ----------
        log_pdf_values : np.ndarray
            对数概率密度值
        """
        return self.dist.logpdf(x)

    def cdf(self, x: np.ndarray) -> np.ndarray:
        """
        计算累积分布函数值

        参数:
        ----------
        x : np.ndarray
            输入点

        返回:
        ----------
        cdf_values : np.ndarray
            累积分布值
        """
        return self.dist.cdf(x)

    def __repr__(self):
        """返回分布的字符串表示"""
        return f"PriorDistribution(type='{self.distribution_type}', params={self.params})"


class JointPrior:
    """
    多维联合先验分布类

    用于处理多个独立的先验分布组成的联合分布
    """

    def __init__(self, priors: list):
        """
        初始化联合先验分布

        参数:
        ----------
        priors : list of PriorDistribution
            各个维度的先验分布列表
        """
        self.priors = priors
        self.n_dim = len(priors)

    def sample(self, size: int) -> np.ndarray:
        """
        从联合先验分布中生成样本

        参数:
        ----------
        size : int
            样本数量

        返回:
        ----------
        samples : np.ndarray, shape (size, n_dim)
            联合样本
        """
        samples = np.zeros((size, self.n_dim))
        for i, prior in enumerate(self.priors):
            samples[:, i] = prior.sample(size)
        return samples

    def log_pdf(self, x: np.ndarray) -> np.ndarray:
        """
        计算联合对数概率密度（假设各维度独立）

        参数:
        ----------
        x : np.ndarray, shape (n_samples, n_dim)
            输入样本

        返回:
        ----------
        log_pdf : np.ndarray, shape (n_samples, 1)
            对数概率密度值
        """
        if x.ndim == 1:
            x = x.reshape(1, -1)

        log_pdf = np.zeros((x.shape[0], 1))
        for i, prior in enumerate(self.priors):
            log_pdf += prior.log_pdf(x[:, i]).reshape(-1, 1)

        return log_pdf

    def __repr__(self):
        """返回联合分布的字符串表示"""
        prior_strs = [f"  Dim {i}: {prior}" for i, prior in enumerate(self.priors)]
        return f"JointPrior({self.n_dim} dimensions):\n" + "\n".join(prior_strs)


class LikelihoodFunction:
    """
    似然函数类

    用于封装用户定义的似然函数
    """

    def __init__(self, func: callable):
        """
        初始化似然函数

        参数:
        ----------
        func : callable
            似然函数，接受参数 theta (np.ndarray) 并返回似然值
            注意：应该返回似然值本身，而不是对数似然
        """
        self.func = func

    def evaluate(self, theta: np.ndarray) -> np.ndarray:
        """
        计算似然值

        参数:
        ----------
        theta : np.ndarray
            参数值

        返回:
        ----------
        likelihood : np.ndarray
            似然值
        """
        return self.func(theta)

    def log_likelihood(self, theta: np.ndarray) -> np.ndarray:
        """
        计算对数似然值

        参数:
        ----------
        theta : np.ndarray
            参数值

        返回:
        ----------
        log_likelihood : np.ndarray
            对数似然值
        """
        likelihood = self.func(theta)
        # 避免 log(0)
        return np.log(likelihood + 1e-300)

    def __repr__(self):
        """返回似然函数的字符串表示"""
        return f"LikelihoodFunction(func={self.func.__name__})"


class GaussianLikelihood(LikelihoodFunction):
    """
    高斯似然函数
    假设观测误差服从独立高斯分布: y_obs ~ N(y_pred, sigma^2)
    Log Likelihood = -0.5 * sum( (y_pred - y_obs)^2 / sigma^2 + log(2*pi*sigma^2) )
    """

    def __init__(self,
                 observed_input: np.ndarray,
                 observed_output_mean: np.ndarray,
                 observed_output_std: np.ndarray,
                 model: callable):
        """
        初始化高斯似然函数

        参数:
        ----------
        observed_input : np.ndarray, shape (n_obs, x_dim)
            试验输入
        observed_output_mean : np.ndarray, shape (n_obs,)
            试验输出观测值 (y_data)
        observed_output_std : np.ndarray, shape (n_obs,)
            试验观测噪声标准差 (sigma)。
            注意：在高斯似然中，sigma 必须 > 0。如果是确定性数据，建议给一个极小值代表数值误差。
        model : callable
            模型函数，接受形状为 [batch_size, x_dim + theta_dim] 的输入
        """
        self.observed_input = observed_input
        self.observed_output_mean = observed_output_mean

        # 数值稳定性处理：防止 sigma 为 0 导致除零错误
        # 高斯似然在 sigma -> 0 时趋向无穷大，必须截断
        self.observed_output_std = np.where(observed_output_std < 1e-9, 1e-9, observed_output_std)

        self.model_func = model
        self.n_obs = len(observed_output_mean)

        # 调用父类构造函数，指向自身的 evaluate
        super().__init__(lambda theta: self.evaluate(theta))

    def _predict_batch(self, theta: np.ndarray) -> np.ndarray:
        """
        执行批量预测 (与 BVMLikelihood 逻辑完全一致)
        参数:
        ----------
        theta : np.ndarray, shape (chain_size, theta_dim)
        返回:
        ----------
        y_pred : np.ndarray, shape (chain_size, n_obs)
        """
        n_particles = theta.shape[0]
        n_obs = self.n_obs

        # 1. 处理 Theta: 按行重复
        # shape: (n_particles * n_obs, theta_dim)
        theta_repeated = np.repeat(theta, n_obs, axis=0)

        # 2. 处理 X: 整体堆叠
        # shape: (n_particles * n_obs, x_dim)
        x_tiled = np.tile(self.observed_input, (n_particles, 1))

        # 3. 拼接输入
        # shape: (n_particles * n_obs, x_dim + theta_dim)
        input_concat = np.hstack([x_tiled, theta_repeated])

        # 4. 调用模型
        y_pred_flat = self.model_func(input_concat)

        # 5. 还原形状 -> (n_particles, n_obs)
        y_pred = y_pred_flat.reshape(n_particles, n_obs)

        return y_pred

    def log_likelihood(self, theta: np.ndarray) -> np.ndarray:
        """
        计算对数高斯似然
        """
        # 确保 theta 是二维的
        if theta.ndim == 1:
            theta = theta.reshape(1, -1)

        # 1. 获取模型预测: (chain_size, n_obs)
        y_pred = self._predict_batch(theta)

        # 2. 准备数据
        y_obs = self.observed_output_mean  # (n_obs,)
        sigma = self.observed_output_std  # (n_obs,)

        # 3. 计算残差 (Residuals)
        # 利用广播: (chain_size, n_obs) - (n_obs,)
        residuals = y_pred - y_obs

        # 4. 计算对数似然 (Log-Likelihood)
        # 公式: -0.5 * log(2*pi) - log(sigma) - 0.5 * (residual / sigma)^2
        # 注意: 这里是对每个观测点计算，然后求和

        term1 = -0.5 * np.log(2 * np.pi)
        term2 = -np.log(sigma)
        term3 = -0.5 * (residuals / sigma) ** 2

        # log_prob_matrix: shape (chain_size, n_obs)
        log_prob_matrix = term1 + term2 + term3

        # 5. 总对数似然
        # shape: (chain_size, 1)
        log_lik = np.sum(log_prob_matrix, axis=1).reshape(-1, 1)

        return log_lik

    def evaluate(self, theta: np.ndarray) -> np.ndarray:
        """
        计算原始似然值 (Exp of Log-Likelihood)
        """
        log_lik = self.log_likelihood(theta)
        # 为了防止数值下溢 (underflow) 导致变为0，可以考虑减去最大值 (在TMCMC内部通常会处理)
        # 这里直接返回 exp
        return np.exp(log_lik)

    def __repr__(self):
        return (f"GaussianLikelihood(n_obs={self.n_obs}, "
                f"sigma_min={self.observed_output_std.min():.2e})")