-
Notifications
You must be signed in to change notification settings - Fork 43
Expand file tree
/
Copy pathwide_layer.py
More file actions
84 lines (64 loc) · 2.99 KB
/
wide_layer.py
File metadata and controls
84 lines (64 loc) · 2.99 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
import numpy as np
from ftrl import FtrlEstimator
from base_estimator import BaseEstimator
from collections import namedtuple
class WideLayer:
    """Wide (linear) part of a wide&deep-style model.

    Holds one FtrlEstimator per feature field, plus a dedicated 'bias'
    estimator, and sums their linear contributions into a single logit.
    """

    def __init__(self, field_names, alpha, beta, L1, L2, proba_fn):
        """
        :param field_names: names of the sparse feature fields
        :param alpha: FTRL learning-rate parameter, shared by all fields
        :param beta: FTRL learning-rate smoothing parameter
        :param L1: L1 regularization strength
        :param L2: L2 regularization strength
        :param proba_fn: proba_fn(example_idx, logit) -> probability.
            A function is used because, when combined with a DNN, the
            probability must also take the logit contributed by the DNN
            into account.
        """
        self._estimators = {field: FtrlEstimator(alpha=alpha,
                                                 beta=beta,
                                                 L1=L1,
                                                 L2=L2)
                            for field in ['bias'] + field_names}
        self._proba_fn = proba_fn

    def __predict_logit(self, sp_features, example_idx):
        """Sum every field's linear contribution for one example."""
        logit = 0
        for field, estimator in self._estimators.items():
            if field == 'bias':
                # the bias is modeled as a constant feature: id=0, value=1
                feat_ids, feat_vals = [0], [1]
            else:
                sp_input = sp_features[field]
                feat_ids, feat_vals = sp_input.get_example_in_order(example_idx)
            logit += estimator.predict_logit(feature_ids=feat_ids, feature_values=feat_vals)
        return logit

    def train(self, sp_features, labels):
        """Train on one batch, one example at a time (FTRL is online).

        :param sp_features: dict from field_name ==> SparseInput
        :param labels: ground-truth labels, one per example
        :return: probabilities from this train batch, as an np.ndarray
        """
        probas = []
        for example_idx, label in enumerate(labels):
            logit = self.__predict_logit(sp_features, example_idx)
            pred_proba = self._proba_fn(example_idx, logit)
            probas.append(pred_proba)
            # field names are not needed here, iterate values directly
            for estimator in self._estimators.values():
                estimator.update(pred_proba=pred_proba, label=label)
        return np.asarray(probas)

    def predict_logits(self, sp_features):
        """Return one logit per example, as an np.ndarray.

        Assumes every SparseInput in sp_features has the same number of
        examples; an empty dict yields an empty array (the original code
        crashed on range(None) in that case).
        """
        if sp_features:
            batch_size = next(iter(sp_features.values())).n_total_examples
        else:
            batch_size = 0
        logits = [self.__predict_logit(sp_features, example_idx)
                  for example_idx in range(batch_size)]
        return np.asarray(logits)
WideHParams = namedtuple("WideHParams", ['field_names', 'alpha', 'beta', 'L1', 'L2'])
def _sigmoid(example_idx, logit):
return 1 / (1 + np.exp(-logit))
class WideEstimator(BaseEstimator):
    """A standalone linear model trained with FTRL (the 'wide' half of a
    wide&deep architecture), exposed through the BaseEstimator interface."""

    def __init__(self, hparams, data_source):
        """
        :param hparams: WideHParams carrying field names and FTRL settings
        :param data_source: forwarded to BaseEstimator
        """
        ftrl_kwargs = dict(alpha=hparams.alpha,
                           beta=hparams.beta,
                           L1=hparams.L1,
                           L2=hparams.L2)
        self._layer = WideLayer(field_names=hparams.field_names,
                                proba_fn=_sigmoid,
                                **ftrl_kwargs)
        super().__init__(data_source)

    def train_batch(self, features, labels):
        """Run one FTRL training pass and return the batch probabilities."""
        return self._layer.train(sp_features=features, labels=labels)

    def predict(self, features):
        """Map per-example logits to probabilities with an elementwise sigmoid."""
        logits = self._layer.predict_logits(sp_features=features)
        return 1.0 / (1.0 + np.exp(-logits))