在上次的文章中我写了如何自定义loss，但是我真正想要使用的场景比那些还要复杂一些。

问题出现

我想在自定义loss函数中先对y_pred进行reshape，然后再计算sigmoid_cross_entropy_with_logits。但是keras会将loss构建成一个graph，并且loss中的y_true并不是普通的占位符，而是一个shape根据模型最终输出维度来确定的“虚”占位符；如果模型最后输出的维度和真正的y_true维度不匹配，就一定会报错。

看下面这个例子：

import tensorflow as tf
from tensorflow.python import keras
import numpy as np
# Clear the Keras backend session before building the model.
keras.backend.clear_session()
# `shape` must be a tuple: `(10)` is just the int 10, so spell the
# one-element tuple explicitly as `(10,)`.
x = keras.Input(shape=(10,))
# Two Dense heads on the same input, with 35 (= 5 * 7) and 70 (= 10 * 7) units.
x_1 = keras.layers.Dense(35)(x)
x_2 = keras.layers.Dense(70)(x)
model = keras.Model(inputs=x, outputs=[x_1, x_2])
model.summary()

def l_1(true, pred):
    """Return the summed sigmoid cross-entropy for the first model output.

    `pred` is reshaped to (-1, 5, 7) before the loss is computed, and the
    shapes of `true` and the reshaped logits are printed for inspection.
    """
    logits = tf.reshape(pred, (-1, 5, 7))
    print(true.shape, logits.shape)
    # NOTE: after the reshape the logits are meant to match the real labels,
    # but the shape check still raises an error.
    per_element = tf.nn.sigmoid_cross_entropy_with_logits(labels=true, logits=logits)
    return tf.reduce_sum(per_element)

def l_2(true, pred):
    """Return the summed sigmoid cross-entropy for the second model output.

    `pred` is reshaped to (-1, 10, 7) before the loss is computed, and the
    shapes of `true` and the reshaped logits are printed for inspection.
    """
    logits = tf.reshape(pred, (-1, 10, 7))
    print(true.shape, logits.shape)
    # NOTE: after the reshape the logits are meant to match the real labels,
    # but the shape check still raises an error.
    per_element = tf.nn.sigmoid_cross_entropy_with_logits(labels=true, logits=logits)
    return tf.reduce_sum(per_element)

# Random data: 100 samples of 10 features, with labels shaped (5, 7) and (10, 7).
train_set = (
    tf.data.Dataset.from_tensor_slices((
        np.random.rand(100, 10),
        np.random.rand(100, 5, 7),
        np.random.rand(100, 10, 7),
    ))
    .repeat()
    # Regroup every element as (features, (label_1, label_2)) for the two outputs.
    .map(lambda feats, y_a, y_b: (feats, (y_a, y_b)))
    .batch(32)
)  # type: tf.data.Dataset

model.compile(optimizer='adam', loss=[l_1, l_2])
model.fit(x=train_set, steps_per_epoch=30)  # NOTE: cannot train

输出：

(?, ?) (?, 5, 7)
ValueError: logits and labels must have the same shape ((?, 5, 7) vs (?, ?))

可以看到打印出来的y_true的shape是(?, ?)，和网络输出的维度数相同，而不是真实标签的(?, 5, 7)；但实际上输入的y_true是正确的，这个实在是让人蛋疼。

错误解决

因为y_true的shape就是和网络输出尺寸相同，所以就从网络上面下手：在原模型的输出后面接上Reshape层，构建一个model_warpper用于训练。由于model_warpper和model共用同一组Dense层，等训练完成之后直接保存model即可。

import tensorflow as tf
from tensorflow.python import keras
import numpy as np
# Clear the Keras backend session before building the model.
keras.backend.clear_session()
# `shape` must be a tuple: `(10)` is just the int 10, so spell the
# one-element tuple explicitly as `(10,)`.
x = keras.Input(shape=(10,))
# Two Dense heads on the same input, with 35 (= 5 * 7) and 70 (= 10 * 7) units.
x_1 = keras.layers.Dense(35)(x)
x_2 = keras.layers.Dense(70)(x)
model = keras.Model(inputs=x, outputs=[x_1, x_2])
model.summary()


def l_1(true, pred):
    """Return the summed sigmoid cross-entropy for the first model output.

    `pred` is reshaped to (-1, 5, 7) before the loss is computed, and the
    shapes of `true` and the reshaped logits are printed for inspection.
    """
    logits = tf.reshape(pred, (-1, 5, 7))
    print(true.shape, logits.shape)
    # NOTE: with a flat model output this is where the shape check fails even
    # though the reshaped logits match the real labels; the version trained
    # below ends the model in a Reshape layer instead.
    per_element = tf.nn.sigmoid_cross_entropy_with_logits(labels=true, logits=logits)
    return tf.reduce_sum(per_element)


def l_2(true, pred):
    """Return the summed sigmoid cross-entropy for the second model output.

    `pred` is reshaped to (-1, 10, 7) before the loss is computed, and the
    shapes of `true` and the reshaped logits are printed for inspection.
    """
    logits = tf.reshape(pred, (-1, 10, 7))
    print(true.shape, logits.shape)
    # NOTE: with a flat model output this is where the shape check fails even
    # though the reshaped logits match the real labels; the version trained
    # below ends the model in a Reshape layer instead.
    per_element = tf.nn.sigmoid_cross_entropy_with_logits(labels=true, logits=logits)
    return tf.reduce_sum(per_element)


# Random data: 100 samples of 10 features, with labels shaped (5, 7) and (10, 7).
train_set = (
    tf.data.Dataset.from_tensor_slices((
        np.random.rand(100, 10),
        np.random.rand(100, 5, 7),
        np.random.rand(100, 10, 7),
    ))
    .repeat()
    # Regroup every element as (features, (label_1, label_2)) for the two outputs.
    .map(lambda feats, y_a, y_b: (feats, (y_a, y_b)))
    .batch(32)
)  # type: tf.data.Dataset

# Training the flat-output model directly is left disabled:
# model.compile('adam', loss=[l_1, l_2])
# model.fit(train_set, steps_per_epoch=30)  # NOTE: cannot train

# Append Reshape layers so the wrapper's outputs have the label shapes
# (5, 7) and (10, 7), then train the wrapper instead of `model`.
x_1 = keras.layers.Reshape(target_shape=(5, 7))(x_1)
x_2 = keras.layers.Reshape(target_shape=(10, 7))(x_2)
model_warpper = keras.Model(inputs=x, outputs=[x_1, x_2])
model_warpper.summary()
model_warpper.compile(optimizer='adam', loss=[l_1, l_2])
model_warpper.fit(x=train_set, steps_per_epoch=30)  # NOTE: trainable

tf.keras自定义loss报错shape mismatch

tf.keras自定义loss报错shape mismatch

问题出现

错误解决