2019-06-05 15:06:02 -06:00
|
|
|
# Copyright 2018, The TensorFlow Authors.
|
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
|
|
|
"""Loss functions for bolton method"""
|
|
|
|
|
|
|
|
from __future__ import absolute_import
|
|
|
|
from __future__ import division
|
|
|
|
from __future__ import print_function
|
|
|
|
import tensorflow as tf
|
|
|
|
from tensorflow.python.keras import losses
|
|
|
|
from tensorflow.python.keras.utils import losses_utils
|
|
|
|
from tensorflow.python.framework import ops as _ops
|
2019-06-10 14:11:47 -06:00
|
|
|
from tensorflow.python.keras.regularizers import L1L2
|
2019-06-05 15:06:02 -06:00
|
|
|
|
|
|
|
|
2019-06-10 14:11:47 -06:00
|
|
|
class StrongConvexMixin:
  """Mixin declaring the constants a strongly convex loss must provide.

  Strong Convex Mixin base class for any loss function that will be used with
  Bolton model. Subclasses must be strongly convex and implement the
  associated constants. They must also conform to the requirements of tf losses
  (see super class).

  For more details on the strong convexity requirements, see:
  Bolt-on Differential Privacy for Scalable Stochastic Gradient
  Descent-based Analytics by Xi Wu et al.
  """

  def radius(self):
    """Radius, R, of the hypothesis space W.

    W is a convex set that forms the hypothesis space.

    Returns:
      R

    Raises:
      NotImplementedError: always; subclasses must override this method.
    """
    raise NotImplementedError("Radius not implemented for StrongConvex Loss "
                              "function: %s" % str(self.__class__.__name__))

  def gamma(self):
    """Strong convexity, gamma.

    Returns:
      gamma

    Raises:
      NotImplementedError: always; subclasses must override this method.
    """
    raise NotImplementedError("Gamma not implemented for StrongConvex Loss "
                              "function: %s" % str(self.__class__.__name__))

  def beta(self, class_weight):
    """Smoothness, beta.

    Args:
      class_weight: the class weights as scalar or 1d tensor, where its
        dimensionality is equal to the number of outputs.

    Returns:
      Beta

    Raises:
      NotImplementedError: always; subclasses must override this method.
    """
    raise NotImplementedError("Beta not implemented for StrongConvex Loss "
                              "function: %s" % str(self.__class__.__name__))

  def lipchitz_constant(self, class_weight):
    """Lipchitz constant, L.

    Args:
      class_weight: class weights used

    Returns:
      L

    Raises:
      NotImplementedError: always; subclasses must override this method.
    """
    raise NotImplementedError("lipchitz constant not implemented for "
                              "StrongConvex Loss "
                              "function: %s" % str(self.__class__.__name__))

  def kernel_regularizer(self):
    """Returns the kernel_regularizer to be used.

    Any subclass should override this method if it wants a kernel_regularizer
    (i.e. if one is required for the loss function to be strongly convex).

    Returns:
      None in this base implementation; overrides may return a
      kernel_regularizer instead.
    """
    return None

  def max_class_weight(self, class_weight, dtype):
    """The maximum weighting in class weights (max value) as a scalar tensor.

    Args:
      class_weight: class weights used
      dtype: the data type for tensor conversions.

    Returns:
      maximum class weighting as tensor scalar
    """
    # Convert first so that Python scalars and sequences are accepted too.
    class_weight = _ops.convert_to_tensor_v2(class_weight, dtype)
    return tf.math.reduce_max(class_weight)
|
|
|
|
|
|
|
|
|
2019-06-17 11:25:30 -06:00
|
|
|
class StrongConvexHuber(losses.Loss, StrongConvexMixin):
  """Strong Convex version of Huber loss using l2 weight regularization."""

  def __init__(self,
               reg_lambda: float,
               C: float,
               radius_constant: float,
               delta: float,
               reduction: str = losses_utils.ReductionV2.SUM_OVER_BATCH_SIZE,
               dtype=tf.float32):
    """Constructor.

    Args:
      reg_lambda: Weight regularization constant. Must be positive.
      C: Penalty parameter C of the loss term. Must be positive.
      radius_constant: constant defining the length of the radius. Must be
        positive.
      delta: delta value in huber loss. When to switch from quadratic to
        absolute deviation. Must be positive.
      reduction: reduction type to use. See super class
      dtype: tf datatype to use for tensor conversions.

    Raises:
      ValueError: if reg_lambda, C, radius_constant or delta is not strictly
        positive.
    """
    if C <= 0:
      raise ValueError('c: {0}, should be > 0'.format(C))
    if reg_lambda <= 0:
      raise ValueError("reg lambda: {0} must be positive".format(reg_lambda))
    if radius_constant <= 0:
      raise ValueError(
          'radius_constant: {0}, should be > 0'.format(radius_constant))
    if delta <= 0:
      raise ValueError('delta: {0}, should be > 0'.format(delta))
    self.C = C  # pylint: disable=invalid-name
    self.delta = delta
    self.radius_constant = radius_constant
    self.dtype = dtype
    self.reg_lambda = tf.constant(reg_lambda, dtype=self.dtype)
    super(StrongConvexHuber, self).__init__(
        name='huber',
        reduction=reduction,
    )

  def call(self, y_true, y_pred):
    """Compute loss.

    With z = y_pred * y_true and h = delta, the loss is evaluated
    element-wise as:
      0                          if z > 1 + h
      (1 + h - z)^2 / (4 * h)    if |1 - z| <= h
      1 - z                      otherwise (z < 1 - h)

    Args:
      y_true: Ground truth values. One hot encoded using -1 and 1.
      y_pred: The predicted values.

    Returns:
      Loss values, with the same shape as y_pred * y_true.
    """
    # NOTE(review): unlike StrongConvexBinaryCrossentropy.call, C is not
    # applied here although beta() and lipchitz_constant() use it -- confirm
    # this is intended.
    h = self.delta
    z = y_pred * y_true
    one = tf.constant(1, dtype=self.dtype)
    four = tf.constant(4, dtype=self.dtype)

    quadratic = one / (four * h) * tf.math.pow(one + h - z, 2)
    linear = one - z
    # Select per element with tf.where: a Python `if` on a tensor comparison
    # only works for scalar eager tensors and breaks on batched/graph inputs.
    # Every branch has the shape of z, so no broadcasting is needed.
    return tf.where(
        z > one + h,
        tf.zeros_like(z),
        tf.where(tf.math.abs(one - z) <= h, quadratic, linear))

  def radius(self):
    """See super class.

    Returns:
      radius_constant / reg_lambda
    """
    return self.radius_constant / self.reg_lambda

  def gamma(self):
    """See super class.

    Returns:
      reg_lambda
    """
    return self.reg_lambda

  def beta(self, class_weight):
    """See super class.

    Returns:
      C * max(class_weight) / (2 * delta) + reg_lambda
    """
    max_class_weight = self.max_class_weight(class_weight, self.dtype)
    delta = _ops.convert_to_tensor_v2(self.delta, dtype=self.dtype)
    two = tf.constant(2, dtype=self.dtype)
    return self.C * max_class_weight / (delta * two) + self.reg_lambda

  def lipchitz_constant(self, class_weight):
    """See super class.

    Returns:
      C * max(class_weight) + reg_lambda * radius()
    """
    # if class_weight is provided,
    # it should be a vector of the same size of number of classes
    max_class_weight = self.max_class_weight(class_weight, self.dtype)
    return self.C * max_class_weight + self.reg_lambda * self.radius()

  def kernel_regularizer(self):
    """Returns the l2 kernel regularizer built from reg_lambda.

    Required for this loss function to be strongly convex.

    Returns:
      An L1L2 regularizer whose l2 coefficient is reg_lambda / 2.
    """
    # Presumably halved so the penalty is (reg_lambda / 2) * ||w||^2 --
    # verify against the regularizer's definition.
    return L1L2(l2=self.reg_lambda/2)
|
2019-06-10 14:11:47 -06:00
|
|
|
|
2019-06-05 15:06:02 -06:00
|
|
|
|
2019-06-10 14:11:47 -06:00
|
|
|
class StrongConvexBinaryCrossentropy(
    losses.BinaryCrossentropy,
    StrongConvexMixin
):
  """Strong Convex version of BinaryCrossentropy loss.

  Uses l2 weight regularization.
  """

  def __init__(self,
               reg_lambda: float,
               C: float,
               radius_constant: float,
               from_logits: bool = True,
               label_smoothing: float = 0,
               reduction: str = losses_utils.ReductionV2.SUM_OVER_BATCH_SIZE,
               dtype=tf.float32):
    """Constructor.

    Args:
      reg_lambda: Weight regularization constant. Must be positive.
      C: Penalty parameter C of the loss term. Must be positive.
      radius_constant: constant defining the length of the radius. Must be
        positive.
      from_logits: forwarded unchanged to the super class constructor.
      label_smoothing: amount of smoothing to perform on labels
        relaxation of trust in labels, e.g. (1 -> 1-x, 0 -> 0+x).
        Note, the impact of this parameter's effect on privacy
        is not known and thus the default should be used.
      reduction: reduction type to use. See super class
      dtype: tf datatype to use for tensor conversions.

    Raises:
      ValueError: if reg_lambda, C or radius_constant is not strictly
        positive.
    """
    if reg_lambda <= 0:
      raise ValueError("reg lambda: {0} must be positive".format(reg_lambda))
    if C <= 0:
      raise ValueError('c: {0}, should be > 0'.format(C))
    if radius_constant <= 0:
      raise ValueError(
          'radius_constant: {0}, should be > 0'.format(radius_constant))
    self.dtype = dtype
    self.C = C  # pylint: disable=invalid-name
    self.reg_lambda = tf.constant(reg_lambda, dtype=self.dtype)
    super(StrongConvexBinaryCrossentropy, self).__init__(
        reduction=reduction,
        name='binarycrossentropy',
        from_logits=from_logits,
        label_smoothing=label_smoothing,
    )
    self.radius_constant = radius_constant

  def call(self, y_true, y_pred):
    """Compute loss.

    Args:
      y_true: Ground truth values.
      y_pred: The predicted values.

    Returns:
      The super class loss values scaled by C.
    """
    loss = super(StrongConvexBinaryCrossentropy, self).call(y_true, y_pred)
    return loss * self.C

  def radius(self):
    """See super class.

    Returns:
      radius_constant / reg_lambda
    """
    return self.radius_constant / self.reg_lambda

  def gamma(self):
    """See super class.

    Returns:
      reg_lambda
    """
    return self.reg_lambda

  def beta(self, class_weight):
    """See super class.

    Returns:
      C * max(class_weight) + reg_lambda
    """
    max_class_weight = self.max_class_weight(class_weight, self.dtype)
    return self.C * max_class_weight + self.reg_lambda

  def lipchitz_constant(self, class_weight):
    """See super class.

    Returns:
      C * max(class_weight) + reg_lambda * radius()
    """
    max_class_weight = self.max_class_weight(class_weight, self.dtype)
    return self.C * max_class_weight + self.reg_lambda * self.radius()

  def kernel_regularizer(self):
    """Returns the l2 kernel regularizer built from reg_lambda.

    Required for this loss function to be strongly convex.

    Returns:
      An L1L2 regularizer whose l2 coefficient is reg_lambda / 2.
    """
    # Presumably halved so the penalty is (reg_lambda / 2) * ||w||^2 --
    # verify against the regularizer's definition.
    return L1L2(l2=self.reg_lambda/2)
|
2019-06-10 14:11:47 -06:00
|
|
|
|
|
|
|
|
|
|
|
# class StrongConvexSparseCategoricalCrossentropy(
|
|
|
|
# losses.CategoricalCrossentropy,
|
|
|
|
# StrongConvexMixin
|
|
|
|
# ):
|
|
|
|
# """
|
|
|
|
# Strong Convex version of CategoricalCrossentropy loss using l2 weight
|
|
|
|
# regularization.
|
|
|
|
# """
|
|
|
|
#
|
|
|
|
# def __init__(self,
|
|
|
|
# reg_lambda: float,
|
|
|
|
# C: float,
|
|
|
|
# radius_constant: float,
|
|
|
|
# from_logits: bool = True,
|
|
|
|
# label_smoothing: float = 0,
|
|
|
|
# reduction: str = losses_utils.ReductionV2.SUM_OVER_BATCH_SIZE,
|
|
|
|
# name: str = 'binarycrossentropy',
|
|
|
|
# dtype=tf.float32):
|
|
|
|
# """
|
|
|
|
# Args:
|
|
|
|
# reg_lambda: Weight regularization constant
|
|
|
|
# C: Penalty parameter C of the loss term
|
|
|
|
# radius_constant: constant defining the length of the radius
|
|
|
|
# reduction: reduction type to use. See super class
|
|
|
|
# label_smoothing: amount of smoothing to perform on labels
|
|
|
|
# relaxation of trust in labels, e.g. (1 -> 1-x, 0 -> 0+x)
|
|
|
|
# name: Name of the loss instance
|
|
|
|
# dtype: tf datatype to use for tensor conversions.
|
|
|
|
# """
|
|
|
|
# if reg_lambda <= 0:
|
|
|
|
# raise ValueError("reg lambda: {0} must be positive".format(reg_lambda))
|
|
|
|
# if C <= 0:
|
|
|
|
# raise ValueError('c: {0}, should be >= 0'.format(C))
|
|
|
|
# if radius_constant <= 0:
|
|
|
|
# raise ValueError('radius_constant: {0}, should be >= 0'.format(
|
|
|
|
# radius_constant
|
|
|
|
# ))
|
|
|
|
#
|
|
|
|
# self.C = C
|
|
|
|
# self.dtype = dtype
|
|
|
|
# self.reg_lambda = tf.constant(reg_lambda, dtype=self.dtype)
|
|
|
|
# super(StrongConvexSparseCategoricalCrossentropy, self).__init__(
|
|
|
|
# reduction=reduction,
|
|
|
|
# name=name,
|
|
|
|
# from_logits=from_logits,
|
|
|
|
# label_smoothing=label_smoothing,
|
|
|
|
# )
|
|
|
|
# self.radius_constant = radius_constant
|
|
|
|
#
|
|
|
|
# def call(self, y_true, y_pred):
|
|
|
|
# """Compute loss
|
|
|
|
#
|
|
|
|
# Args:
|
|
|
|
# y_true: Ground truth values.
|
|
|
|
# y_pred: The predicted values.
|
|
|
|
#
|
|
|
|
# Returns:
|
|
|
|
# Loss values per sample.
|
|
|
|
# """
|
|
|
|
# loss = super()
|
|
|
|
# loss = loss * self.C
|
|
|
|
# return loss
|
|
|
|
#
|
|
|
|
# def radius(self):
|
|
|
|
# """See super class.
|
|
|
|
# """
|
|
|
|
# return self.radius_constant / self.reg_lambda
|
|
|
|
#
|
|
|
|
# def gamma(self):
|
|
|
|
# """See super class.
|
|
|
|
# """
|
|
|
|
# return self.reg_lambda
|
|
|
|
#
|
|
|
|
# def beta(self, class_weight):
|
|
|
|
# """See super class.
|
|
|
|
# """
|
|
|
|
# max_class_weight = self.max_class_weight(class_weight, self.dtype)
|
|
|
|
# return self.C * max_class_weight + self.reg_lambda
|
|
|
|
#
|
|
|
|
# def lipchitz_constant(self, class_weight):
|
|
|
|
# """See super class.
|
|
|
|
# """
|
|
|
|
# max_class_weight = self.max_class_weight(class_weight, self.dtype)
|
|
|
|
# return self.C * max_class_weight + self.reg_lambda * self.radius()
|
|
|
|
#
|
|
|
|
# def kernel_regularizer(self):
|
|
|
|
# """
|
|
|
|
# l2 loss using reg_lambda as the l2 term (as desired). Required for
|
|
|
|
# this loss function to be strongly convex.
|
|
|
|
# :return:
|
|
|
|
# """
|
|
|
|
# return L1L2(l2=self.reg_lambda)
|
|
|
|
#
|
|
|
|
# class StrongConvexSparseCategoricalCrossentropy(
|
|
|
|
# losses.SparseCategoricalCrossentropy,
|
|
|
|
# StrongConvexMixin
|
|
|
|
# ):
|
|
|
|
# """
|
|
|
|
# Strong Convex version of SparseCategoricalCrossentropy loss using l2 weight
|
|
|
|
# regularization.
|
|
|
|
# """
|
|
|
|
#
|
|
|
|
# def __init__(self,
|
|
|
|
# reg_lambda: float,
|
|
|
|
# C: float,
|
|
|
|
# radius_constant: float,
|
|
|
|
# from_logits: bool = True,
|
|
|
|
# label_smoothing: float = 0,
|
|
|
|
# reduction: str = losses_utils.ReductionV2.SUM_OVER_BATCH_SIZE,
|
|
|
|
# name: str = 'binarycrossentropy',
|
|
|
|
# dtype=tf.float32):
|
|
|
|
# """
|
|
|
|
# Args:
|
|
|
|
# reg_lambda: Weight regularization constant
|
|
|
|
# C: Penalty parameter C of the loss term
|
|
|
|
# radius_constant: constant defining the length of the radius
|
|
|
|
# reduction: reduction type to use. See super class
|
|
|
|
# label_smoothing: amount of smoothing to perform on labels
|
|
|
|
# relaxation of trust in labels, e.g. (1 -> 1-x, 0 -> 0+x)
|
|
|
|
# name: Name of the loss instance
|
|
|
|
# dtype: tf datatype to use for tensor conversions.
|
|
|
|
# """
|
|
|
|
# if reg_lambda <= 0:
|
|
|
|
# raise ValueError("reg lambda: {0} must be positive".format(reg_lambda))
|
|
|
|
# if C <= 0:
|
|
|
|
# raise ValueError('c: {0}, should be >= 0'.format(C))
|
|
|
|
# if radius_constant <= 0:
|
|
|
|
# raise ValueError('radius_constant: {0}, should be >= 0'.format(
|
|
|
|
# radius_constant
|
|
|
|
# ))
|
|
|
|
#
|
|
|
|
# self.C = C
|
|
|
|
# self.dtype = dtype
|
|
|
|
# self.reg_lambda = tf.constant(reg_lambda, dtype=self.dtype)
|
|
|
|
# super(StrongConvexHuber, self).__init__(reduction=reduction,
|
|
|
|
# name=name,
|
|
|
|
# from_logits=from_logits,
|
|
|
|
# label_smoothing=label_smoothing,
|
|
|
|
# )
|
|
|
|
# self.radius_constant = radius_constant
|
|
|
|
#
|
|
|
|
# def call(self, y_true, y_pred):
|
|
|
|
# """Compute loss
|
|
|
|
#
|
|
|
|
# Args:
|
|
|
|
# y_true: Ground truth values.
|
|
|
|
# y_pred: The predicted values.
|
|
|
|
#
|
|
|
|
# Returns:
|
|
|
|
# Loss values per sample.
|
|
|
|
# """
|
|
|
|
# loss = super()
|
|
|
|
# loss = loss * self.C
|
|
|
|
# return loss
|
|
|
|
#
|
|
|
|
# def radius(self):
|
|
|
|
# """See super class.
|
|
|
|
# """
|
|
|
|
# return self.radius_constant / self.reg_lambda
|
|
|
|
#
|
|
|
|
# def gamma(self):
|
|
|
|
# """See super class.
|
|
|
|
# """
|
|
|
|
# return self.reg_lambda
|
|
|
|
#
|
|
|
|
# def beta(self, class_weight):
|
|
|
|
# """See super class.
|
|
|
|
# """
|
|
|
|
# max_class_weight = self.max_class_weight(class_weight, self.dtype)
|
|
|
|
# return self.C * max_class_weight + self.reg_lambda
|
|
|
|
#
|
|
|
|
# def lipchitz_constant(self, class_weight):
|
|
|
|
# """See super class.
|
|
|
|
# """
|
|
|
|
# max_class_weight = self.max_class_weight(class_weight, self.dtype)
|
|
|
|
# return self.C * max_class_weight + self.reg_lambda * self.radius()
|
|
|
|
#
|
|
|
|
# def kernel_regularizer(self):
|
|
|
|
# """
|
|
|
|
# l2 loss using reg_lambda as the l2 term (as desired). Required for
|
|
|
|
# this loss function to be strongly convex.
|
|
|
|
# :return:
|
|
|
|
# """
|
|
|
|
# return L1L2(l2=self.reg_lambda)
|
|
|
|
#
|
|
|
|
#
|
|
|
|
# class StrongConvexCategoricalCrossentropy(
|
|
|
|
# losses.CategoricalCrossentropy,
|
|
|
|
# StrongConvexMixin
|
|
|
|
# ):
|
|
|
|
# """
|
|
|
|
# Strong Convex version of CategoricalCrossentropy loss using l2 weight
|
|
|
|
# regularization.
|
|
|
|
# """
|
|
|
|
#
|
|
|
|
# def __init__(self,
|
|
|
|
# reg_lambda: float,
|
|
|
|
# C: float,
|
|
|
|
# radius_constant: float,
|
|
|
|
# from_logits: bool = True,
|
|
|
|
# label_smoothing: float = 0,
|
|
|
|
# reduction: str = losses_utils.ReductionV2.SUM_OVER_BATCH_SIZE,
|
|
|
|
# name: str = 'binarycrossentropy',
|
|
|
|
# dtype=tf.float32):
|
|
|
|
# """
|
|
|
|
# Args:
|
|
|
|
# reg_lambda: Weight regularization constant
|
|
|
|
# C: Penalty parameter C of the loss term
|
|
|
|
# radius_constant: constant defining the length of the radius
|
|
|
|
# reduction: reduction type to use. See super class
|
|
|
|
# label_smoothing: amount of smoothing to perform on labels
|
|
|
|
# relaxation of trust in labels, e.g. (1 -> 1-x, 0 -> 0+x)
|
|
|
|
# name: Name of the loss instance
|
|
|
|
# dtype: tf datatype to use for tensor conversions.
|
|
|
|
# """
|
|
|
|
# if reg_lambda <= 0:
|
|
|
|
# raise ValueError("reg lambda: {0} must be positive".format(reg_lambda))
|
|
|
|
# if C <= 0:
|
|
|
|
# raise ValueError('c: {0}, should be >= 0'.format(C))
|
|
|
|
# if radius_constant <= 0:
|
|
|
|
# raise ValueError('radius_constant: {0}, should be >= 0'.format(
|
|
|
|
# radius_constant
|
|
|
|
# ))
|
|
|
|
#
|
|
|
|
# self.C = C
|
|
|
|
# self.dtype = dtype
|
|
|
|
# self.reg_lambda = tf.constant(reg_lambda, dtype=self.dtype)
|
|
|
|
# super(StrongConvexHuber, self).__init__(reduction=reduction,
|
|
|
|
# name=name,
|
|
|
|
# from_logits=from_logits,
|
|
|
|
# label_smoothing=label_smoothing,
|
|
|
|
# )
|
|
|
|
# self.radius_constant = radius_constant
|
|
|
|
#
|
|
|
|
# def call(self, y_true, y_pred):
|
|
|
|
# """Compute loss
|
|
|
|
#
|
|
|
|
# Args:
|
|
|
|
# y_true: Ground truth values.
|
|
|
|
# y_pred: The predicted values.
|
|
|
|
#
|
|
|
|
# Returns:
|
|
|
|
# Loss values per sample.
|
|
|
|
# """
|
|
|
|
# loss = super()
|
|
|
|
# loss = loss * self.C
|
|
|
|
# return loss
|
|
|
|
#
|
|
|
|
# def radius(self):
|
|
|
|
# """See super class.
|
|
|
|
# """
|
|
|
|
# return self.radius_constant / self.reg_lambda
|
|
|
|
#
|
|
|
|
# def gamma(self):
|
|
|
|
# """See super class.
|
|
|
|
# """
|
|
|
|
# return self.reg_lambda
|
|
|
|
#
|
|
|
|
# def beta(self, class_weight):
|
|
|
|
# """See super class.
|
|
|
|
# """
|
|
|
|
# max_class_weight = self.max_class_weight(class_weight, self.dtype)
|
|
|
|
# return self.C * max_class_weight + self.reg_lambda
|
|
|
|
#
|
|
|
|
# def lipchitz_constant(self, class_weight):
|
|
|
|
# """See super class.
|
|
|
|
# """
|
|
|
|
# max_class_weight = self.max_class_weight(class_weight, self.dtype)
|
|
|
|
# return self.C * max_class_weight + self.reg_lambda * self.radius()
|
|
|
|
#
|
|
|
|
# def kernel_regularizer(self):
|
|
|
|
# """
|
|
|
|
# l2 loss using reg_lambda as the l2 term (as desired). Required for
|
|
|
|
# this loss function to be strongly convex.
|
|
|
|
# :return:
|
|
|
|
# """
|
|
|
|
# return L1L2(l2=self.reg_lambda)
|