2020-08-14 16:31:13 +08:00
|
|
|
#copyright (c) 2019 PaddlePaddle Authors. All Rights Reserve.
|
|
|
|
#
|
|
|
|
#Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
#you may not use this file except in compliance with the License.
|
|
|
|
#You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
#Unless required by applicable law or agreed to in writing, software
|
|
|
|
#distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
#WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
#See the License for the specific language governing permissions and
|
|
|
|
#limitations under the License.
|
|
|
|
|
|
|
|
from __future__ import absolute_import
|
|
|
|
from __future__ import division
|
|
|
|
from __future__ import print_function
|
|
|
|
|
|
|
|
import math
|
|
|
|
|
|
|
|
import paddle
|
|
|
|
import paddle.fluid as fluid
|
|
|
|
|
|
|
|
|
|
|
|
class SRNLoss(object):
|
|
|
|
def __init__(self, params):
|
|
|
|
super(SRNLoss, self).__init__()
|
|
|
|
self.char_num = params['char_num']
|
|
|
|
|
|
|
|
def __call__(self, predicts, others):
|
|
|
|
predict = predicts['predict']
|
|
|
|
word_predict = predicts['word_out']
|
|
|
|
gsrm_predict = predicts['gsrm_out']
|
|
|
|
label = others['label']
|
|
|
|
lbl_weight = others['lbl_weight']
|
|
|
|
|
|
|
|
casted_label = fluid.layers.cast(x=label, dtype='int64')
|
2020-08-15 15:45:55 +08:00
|
|
|
cost_word = fluid.layers.cross_entropy(
|
|
|
|
input=word_predict, label=casted_label)
|
|
|
|
cost_gsrm = fluid.layers.cross_entropy(
|
|
|
|
input=gsrm_predict, label=casted_label)
|
|
|
|
cost_vsfd = fluid.layers.cross_entropy(
|
|
|
|
input=predict, label=casted_label)
|
|
|
|
|
|
|
|
cost_word = fluid.layers.reshape(
|
|
|
|
x=fluid.layers.reduce_sum(cost_word), shape=[1])
|
|
|
|
cost_gsrm = fluid.layers.reshape(
|
|
|
|
x=fluid.layers.reduce_sum(cost_gsrm), shape=[1])
|
|
|
|
cost_vsfd = fluid.layers.reshape(
|
|
|
|
x=fluid.layers.reduce_sum(cost_vsfd), shape=[1])
|
|
|
|
|
|
|
|
sum_cost = fluid.layers.sum(
|
|
|
|
[cost_word, cost_vsfd * 2.0, cost_gsrm * 0.15])
|
|
|
|
|
|
|
|
return [sum_cost, cost_vsfd, cost_word]
|