2019-07-16 08:33:57 -06:00
|
|
|
# Copyright 2019, The TensorFlow Authors.
|
2019-06-05 15:06:02 -06:00
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
|
|
|
"""Loss functions for bolton method"""
|
|
|
|
|
|
|
|
from __future__ import absolute_import
|
|
|
|
from __future__ import division
|
|
|
|
from __future__ import print_function
|
|
|
|
import tensorflow as tf
|
|
|
|
from tensorflow.python.keras import losses
|
|
|
|
from tensorflow.python.keras.utils import losses_utils
|
|
|
|
from tensorflow.python.framework import ops as _ops
|
2019-06-10 14:11:47 -06:00
|
|
|
from tensorflow.python.keras.regularizers import L1L2
|
2019-06-19 08:46:30 -06:00
|
|
|
from tensorflow.python.platform import tf_logging as logging
|
2019-06-05 15:06:02 -06:00
|
|
|
|
|
|
|
|
2019-06-10 14:11:47 -06:00
|
|
|
class StrongConvexMixin:
  """Mixin base class for loss functions that are used with the Bolton model.

  Subclasses must be strongly convex and implement the associated constants
  (radius, gamma, beta and the Lipschitz constant). They must also conform to
  the requirements of tf losses (see super class).

  For more details on the strong convexity requirements, see:
  Bolt-on Differential Privacy for Scalable Stochastic Gradient
  Descent-based Analytics by Xi Wu et al.
  """

  def radius(self):
    """Radius, R, of the hypothesis space W.

    W is a convex set that forms the hypothesis space.

    Returns:
      R

    Raises:
      NotImplementedError: always; subclasses must override this method.
    """
    raise NotImplementedError(
        "Radius not implemented for StrongConvex Loss function: %s"
        % str(self.__class__.__name__))

  def gamma(self):
    """Returns strongly convex parameter, gamma.

    Raises:
      NotImplementedError: always; subclasses must override this method.
    """
    raise NotImplementedError(
        "Gamma not implemented for StrongConvex Loss function: %s"
        % str(self.__class__.__name__))

  def beta(self, class_weight):
    """Smoothness, beta.

    Args:
      class_weight: the class weights as scalar or 1d tensor, where its
        dimensionality is equal to the number of outputs.

    Returns:
      Beta

    Raises:
      NotImplementedError: always; subclasses must override this method.
    """
    raise NotImplementedError(
        "Beta not implemented for StrongConvex Loss function: %s"
        % str(self.__class__.__name__))

  def lipchitz_constant(self, class_weight):
    """Lipchitz constant, L.

    Args:
      class_weight: class weights used

    Returns:
      L

    Raises:
      NotImplementedError: always; subclasses must override this method.
    """
    raise NotImplementedError(
        "lipchitz constant not implemented for StrongConvex Loss function: %s"
        % str(self.__class__.__name__))

  def kernel_regularizer(self):
    """Returns the kernel_regularizer to be used.

    Any subclass should override this method if it wants a kernel_regularizer
    (i.e. if one is required for the loss function to be strongly convex).
    The base implementation returns None.
    """
    return None

  def max_class_weight(self, class_weight, dtype):
    """Returns the maximum weighting in class weights as a scalar tensor.

    Args:
      class_weight: class weights used
      dtype: the data type for tensor conversions.

    Returns:
      maximum class weighting as tensor scalar
    """
    # Convert first so that plain Python scalars and lists are accepted too.
    class_weight = _ops.convert_to_tensor_v2(class_weight, dtype)
    return tf.math.reduce_max(class_weight)
|
|
|
|
|
|
|
|
|
2019-06-17 11:25:30 -06:00
|
|
|
class StrongConvexHuber(losses.Loss, StrongConvexMixin):
  """Strong Convex version of Huber loss using l2 weight regularization."""

  def __init__(self,
               reg_lambda,
               C,
               radius_constant,
               delta,
               reduction=losses_utils.ReductionV2.SUM_OVER_BATCH_SIZE,
               dtype=tf.float32):
    """Constructor.

    Args:
      reg_lambda: Weight regularization constant
      C: Penalty parameter C of the loss term
      radius_constant: constant defining the length of the radius
      delta: delta value in huber loss. When to switch from quadratic to
        absolute deviation.
      reduction: reduction type to use. See super class
      dtype: tf datatype to use for tensor conversions.

    Raises:
      ValueError: if C, reg_lambda, radius_constant or delta is not strictly
        positive.
    """
    # All four constants must be strictly positive; zero is rejected as well,
    # so the messages state "> 0" to match the checks.
    if C <= 0:
      raise ValueError('c: {0}, should be > 0'.format(C))
    if reg_lambda <= 0:
      raise ValueError("reg lambda: {0} must be positive".format(reg_lambda))
    if radius_constant <= 0:
      raise ValueError('radius_constant: {0}, should be > 0'.format(
          radius_constant
      ))
    if delta <= 0:
      raise ValueError('delta: {0}, should be > 0'.format(
          delta
      ))
    self.C = C  # pylint: disable=invalid-name
    self.delta = delta
    self.radius_constant = radius_constant
    self.dtype = dtype
    self.reg_lambda = tf.constant(reg_lambda, dtype=self.dtype)
    super(StrongConvexHuber, self).__init__(
        name='strongconvexhuber',
        reduction=reduction,
    )

  def call(self, y_true, y_pred):
    """Computes loss.

    The loss is evaluated element-wise on z = y_pred * y_true:
      * 0                          where z > 1 + delta
      * (1 + delta - z)^2 / (4 * delta)  where |1 - z| <= delta
      * 1 - z                      otherwise

    Args:
      y_true: Ground truth values. One hot encoded using -1 and 1.
      y_pred: The predicted values.

    Returns:
      Loss values per sample.
    """
    h = self.delta
    z = y_pred * y_true
    one = tf.constant(1, dtype=self.dtype)
    four = tf.constant(4, dtype=self.dtype)
    upper = one + h

    # A Python `if` on a tensor only works for single-element tensors in
    # eager mode. Select between the three regimes element-wise instead so
    # that batched inputs and graph mode are supported. Every operand handed
    # to tf.where has the shape of z, so no broadcasting is relied upon.
    zero_loss = tf.zeros_like(z, dtype=self.dtype)
    quadratic_loss = one / (four * h) * tf.math.pow(upper - z, 2)
    linear_loss = one - z
    return tf.where(
        z > upper,
        zero_loss,
        tf.where(tf.math.abs(one - z) <= h, quadratic_loss, linear_loss))

  def radius(self):
    """See super class."""
    return self.radius_constant / self.reg_lambda

  def gamma(self):
    """See super class."""
    return self.reg_lambda

  def beta(self, class_weight):
    """See super class."""
    max_class_weight = self.max_class_weight(class_weight, self.dtype)
    delta = _ops.convert_to_tensor_v2(self.delta,
                                      dtype=self.dtype
                                     )
    return self.C * max_class_weight / (delta *
                                        tf.constant(2, dtype=self.dtype)) + \
           self.reg_lambda

  def lipchitz_constant(self, class_weight):
    """See super class."""
    # if class_weight is provided,
    # it should be a vector of the same size of number of classes
    max_class_weight = self.max_class_weight(class_weight, self.dtype)
    lc = self.C * max_class_weight + \
         self.reg_lambda * self.radius()
    return lc

  def kernel_regularizer(self):
    """Return l2 loss using 0.5*reg_lambda as the l2 term (as desired).

    L2 regularization is required for this loss function to be strongly convex.

    Returns:
      The L2 regularizer layer for this loss function, with regularizer constant
      set to 0.5 * reg_lambda.
    """
    return L1L2(l2=self.reg_lambda/2)
|
2019-06-10 14:11:47 -06:00
|
|
|
|
2019-06-05 15:06:02 -06:00
|
|
|
|
2019-06-10 14:11:47 -06:00
|
|
|
class StrongConvexBinaryCrossentropy(
    losses.BinaryCrossentropy,
    StrongConvexMixin
):
  """Strongly Convex BinaryCrossentropy loss using l2 weight regularization."""

  def __init__(self,
               reg_lambda,
               C,
               radius_constant,
               from_logits=True,
               label_smoothing=0,
               reduction=losses_utils.ReductionV2.SUM_OVER_BATCH_SIZE,
               dtype=tf.float32):
    """Constructor.

    Args:
      reg_lambda: Weight regularization constant
      C: Penalty parameter C of the loss term
      radius_constant: constant defining the length of the radius
      from_logits: True if the input are unscaled logits. False if they are
        already scaled.
      label_smoothing: amount of smoothing to perform on labels
        relaxation of trust in labels, e.g. (1 -> 1-x, 0 -> 0+x). Note, the
        impact of this parameter's effect on privacy is not known and thus the
        default should be used.
      reduction: reduction type to use. See super class
      dtype: tf datatype to use for tensor conversions.

    Raises:
      ValueError: if reg_lambda, C or radius_constant is not strictly
        positive.
    """
    if label_smoothing != 0:
      logging.warning('The impact of label smoothing on privacy is unknown. '
                      'Use label smoothing at your own risk as it may not '
                      'guarantee privacy.')

    # All three constants must be strictly positive; zero is rejected as
    # well, so the messages state "> 0" to match the checks.
    if reg_lambda <= 0:
      raise ValueError("reg lambda: {0} must be positive".format(reg_lambda))
    if C <= 0:
      raise ValueError('c: {0}, should be > 0'.format(C))
    if radius_constant <= 0:
      raise ValueError('radius_constant: {0}, should be > 0'.format(
          radius_constant
      ))
    self.dtype = dtype
    self.C = C  # pylint: disable=invalid-name
    self.reg_lambda = tf.constant(reg_lambda, dtype=self.dtype)
    super(StrongConvexBinaryCrossentropy, self).__init__(
        reduction=reduction,
        name='strongconvexbinarycrossentropy',
        from_logits=from_logits,
        label_smoothing=label_smoothing,
    )
    self.radius_constant = radius_constant

  def call(self, y_true, y_pred):
    """Computes loss.

    Delegates to the parent BinaryCrossentropy.call and scales the result by
    the penalty parameter C.

    Args:
      y_true: Ground truth values.
      y_pred: The predicted values.

    Returns:
      Loss values per sample.
    """
    loss = super(StrongConvexBinaryCrossentropy, self).call(y_true, y_pred)
    loss = loss * self.C
    return loss

  def radius(self):
    """See super class."""
    return self.radius_constant / self.reg_lambda

  def gamma(self):
    """See super class."""
    return self.reg_lambda

  def beta(self, class_weight):
    """See super class."""
    max_class_weight = self.max_class_weight(class_weight, self.dtype)
    return self.C * max_class_weight + self.reg_lambda

  def lipchitz_constant(self, class_weight):
    """See super class."""
    max_class_weight = self.max_class_weight(class_weight, self.dtype)
    return self.C * max_class_weight + self.reg_lambda * self.radius()

  def kernel_regularizer(self):
    """Return l2 loss using 0.5*reg_lambda as the l2 term (as desired).

    L2 regularization is required for this loss function to be strongly convex.

    Returns:
      The L2 regularizer layer for this loss function, with regularizer constant
      set to 0.5 * reg_lambda.
    """
    return L1L2(l2=self.reg_lambda/2)
|