Embedding a trainable bijector in a Keras model

I am trying to implement a normalizing flow embedded in a Keras model. In all the examples I could find, e.g. the documentation for MAF, the bijectors that make up the normalizing flow are embedded in a TransformedDistribution, and this distribution is exposed directly, e.g. for training.
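
For reference, this is the documented pattern being referred to (a minimal sketch following the tfb.MaskedAutoregressiveFlow docs; the shapes and hidden_units are illustrative):

import tensorflow as tf
import tensorflow_probability as tfp

tfd = tfp.distributions
tfb = tfp.bijectors

# A 2-D standard normal transformed by a masked autoregressive flow
maf = tfd.TransformedDistribution(
    distribution=tfd.Sample(tfd.Normal(loc=0., scale=1.), sample_shape=[2]),
    bijector=tfb.MaskedAutoregressiveFlow(
        shift_and_log_scale_fn=tfb.AutoregressiveNetwork(
            params=2, hidden_units=[10, 10])))

maf.sample(5)  # sampling builds the autoregressive network's variables
# The variables are reachable directly from the distribution itself
print(maf.trainable_variables)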

I am trying to embed this transformed distribution in a Keras model, to match the architecture of my other models, which inherit from tf.keras.Model.

Unfortunately, all my attempts so far (see the code below) have failed to propagate the trainable variables of the transformed distribution to the Keras model.

I have already tried making the bijector inherit from tf.keras.layers.Layer, which did not change anything.

import tensorflow as tf
import tensorflow_probability as tfp

tfd = tfp.distributions
tfb = tfp.bijectors


class Flow(tfb.Bijector, tf.Module):
    """
    tf.Module to register trainable_variables
    """

    def __init__(self, d, init_sigma=0.1, **kwargs):
        super(Flow, self).__init__(
            dtype=tf.float32,
            forward_min_event_ndims=0,
            inverse_min_event_ndims=0,
            **kwargs
        )
        # Shape of the flow goes from Rd to Rd
        self.d = d
        # Weights/Variables initializer
        self.init_sigma = init_sigma
        w_init = tf.random_normal_initializer(stddev=self.init_sigma)
        # Variables
        self.u = tf.Variable(
            w_init(shape=[1, self.d], dtype=tf.float32),
            dtype=tf.float32,
            name='u',
            trainable=True,
        )

    def _forward(self, x):
        return x

    def _inverse(self, y):
        return y

    def _inverse_log_det_jacobian(self, y):
        # Identity map, so the log-det-Jacobian is zero; needed for
        # log_prob() on the TransformedDistribution to be computable
        return tf.zeros_like(y)


class Flows(tf.keras.Model):

    def __init__(self, d=2, shape=(100, 2), n_flows=10):
        super(Flows, self).__init__()
        # Parameters
        self.d = d
        self.shape = shape
        self.n_flows = n_flows
        # Base distribution - MF = Multivariate normal diag
        base_distribution = tfd.MultivariateNormalDiag(
            loc=tf.zeros(shape=shape, dtype=tf.float32)
        )
        # Flows as chain of bijector
        flows = []
        for n in range(n_flows):
            flows.append(Flow(self.d, name=f"flow_{n + 1}"))
        bijector = tfb.Chain(list(reversed(flows)))
        self.flow = tfd.TransformedDistribution(
            distribution=base_distribution,
            bijector=bijector
        )

    def call(self, *inputs):
        return self.flow.bijector.forward(*inputs)

    def log_prob(self, *inputs):
        return self.flow.log_prob(*inputs)

    def sample(self, num):
        return self.flow.sample(num)


q = Flows()
# Call to instantiate variables
q(tf.zeros(q.shape))
# Summary shows no trainable params
q.summary()
# Prints expected trainable params
print(q.flow.trainable_variables)

Do you know if this is possible at all? Thanks!


1 Answer

I ran into this problem as well. It seems to be caused by an incompatibility between TFP and TF 2.0 (see the two related issues https://github.com/tensorflow/probability/issues/355 and https://github.com/tensorflow/probability/issues/946).

As a workaround, you need to add the (trainable) variables of the transformed distribution / bijector as an attribute of the Keras model:

class Flows(tf.keras.Model):

    def __init__(self, d=2, shape=(100, 2), n_flows=10):
        super(Flows, self).__init__()
        # Parameters
        self.d = d
        self.shape = shape
        self.n_flows = n_flows
        # Base distribution - MF = Multivariate normal diag
        base_distribution = tfd.MultivariateNormalDiag(
            loc=tf.zeros(shape=shape, dtype=tf.float32)
        )
        # Flows as chain of bijector
        flows = []
        for n in range(n_flows):
            flows.append(Flow(self.d, name=f"flow_{n + 1}"))
        bijector = tfb.Chain(list(reversed(flows)))
        self.flow = tfd.TransformedDistribution(
            distribution=base_distribution,
            bijector=bijector
        )
        # Workaround for https://github.com/tensorflow/probability/issues/355
        # and https://github.com/tensorflow/probability/issues/946:
        # the bijector's trainable variables must be added as an attribute
        # (the name does not matter), otherwise this model has zero
        # trainable variables
        self._variables = self.flow.variables

    def call(self, *inputs):
        return self.flow.bijector.forward(*inputs)

    def log_prob(self, *inputs):
        return self.flow.log_prob(*inputs)

    def sample(self, num):
        return self.flow.sample(num)

After adding this, your model should have trainable variables and weights to optimize.
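
As a quick check of that claim (a sketch, not part of the original answer; note that the example Flow is an identity map, so its u variables are now tracked but would only receive gradients once _forward/_inverse actually use them):

q = Flows()
q(tf.zeros(q.shape))  # build the model so the variables are created

# With the workaround in place, the Keras model tracks the bijector variables
q.summary()                        # should now report trainable params
print(len(q.trainable_variables))  # expected: one 'u' variable per flow (10)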
