Fix GroupedLinearLayer in TF ConvBERT (#9972)

This commit is contained in:
abhishek thakur 2021-02-03 10:49:07 +01:00 committed by GitHub
parent 71bdc076dd
commit a1a67a3ced
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -435,9 +435,10 @@ class GroupedLinearLayer(tf.keras.layers.Layer):
)
def call(self, hidden_states):
    """Apply the grouped linear projection to ``hidden_states``.

    The input is split into ``self.num_groups`` groups of
    ``self.group_in_dim`` features, the group axis is moved to the front
    so that ``tf.matmul`` runs one batched product against
    ``self.kernel``, and the result is reshaped to
    ``[batch_size, -1, self.output_size]`` before ``self.bias`` is added.

    Args:
        hidden_states: Input tensor; its first dimension is used as the
            batch size.
            NOTE(review): assumes the last dimension equals
            ``num_groups * group_in_dim`` -- confirm against the caller.

    Returns:
        Tensor of shape ``[batch_size, -1, self.output_size]`` with the
        bias added along the last axis.
    """
    # Axis 0 is read as the batch size; it is needed to restore the
    # leading dimension after the rows are flattened below.
    batch_size = shape_list(hidden_states)[0]
    # [-1, num_groups, group_in_dim] -> [num_groups, -1, group_in_dim]:
    # put the group axis first so matmul treats it as the batch axis.
    x = tf.transpose(tf.reshape(hidden_states, [-1, self.num_groups, self.group_in_dim]), [1, 0, 2])
    # NOTE(review): presumably self.kernel's leading axis indexes the
    # groups; its shape is defined outside this method -- confirm.
    x = tf.matmul(x, self.kernel)
    # Move the group axis back behind the flattened row axis.
    x = tf.transpose(x, [1, 0, 2])
    x = tf.reshape(x, [batch_size, -1, self.output_size])
    x = tf.nn.bias_add(value=x, bias=self.bias)
    return x