# Copyright 2018, The TensorFlow Authors. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Implements DPQuery interface for queries over nested structures. """ from __future__ import absolute_import from __future__ import division from __future__ import print_function from distutils.version import LooseVersion import tensorflow as tf from privacy.dp_query import dp_query if LooseVersion(tf.__version__) < LooseVersion('2.0.0'): nest = tf.contrib.framework.nest else: nest = tf.nest class NestedQuery(dp_query.DPQuery): """Implements DPQuery interface for structured queries. NestedQuery evaluates arbitrary nested structures of queries. Records must be nested structures of tensors that are compatible (in type and arity) with the query structure, but are allowed to have deeper structure within each leaf of the query structure. For example, the nested query [q1, q2] is compatible with the record [t1, t2] or [t1, (t2, t3)], but not with (t1, t2), [t1] or [t1, t2, t3]. The entire substructure of each record corresponding to a leaf node of the query structure is routed to the corresponding query. If the same tensor should be consumed by multiple sub-queries, it can be replicated in the record, for example [t1, t1]. NestedQuery is intended to allow privacy mechanisms for groups as described in [McMahan & Andrew, 2018: "A General Approach to Adding Differential Privacy to Iterative Training Procedures" (https://arxiv.org/abs/1812.06210)]. """ def __init__(self, queries): """Initializes the NestedQuery. Args: queries: A nested structure of queries. """ self._queries = queries def _map_to_queries(self, fn, *inputs): def caller(query, *args): return getattr(query, fn)(*args) return nest.map_structure_up_to( self._queries, caller, self._queries, *inputs) def initial_global_state(self): """Returns the initial global state for the NestedQuery.""" return self._map_to_queries('initial_global_state') def derive_sample_params(self, global_state): """Given the global state, derives parameters to use for the next sample. Args: global_state: The current global state. Returns: Parameters to use to process records in the next sample. """ return self._map_to_queries('derive_sample_params', global_state) def initial_sample_state(self, global_state, tensors): """Returns an initial state to use for the next sample. Args: global_state: The current global state. tensors: A structure of tensors used as a template to create the initial sample state. Returns: An initial sample state. """ return self._map_to_queries('initial_sample_state', global_state, tensors) def accumulate_record(self, params, sample_state, record): """Accumulates a single record into the sample state. Args: params: The parameters for the sample. sample_state: The current sample state. record: The record to accumulate. Returns: The updated sample state. """ return self._map_to_queries( 'accumulate_record', params, sample_state, record) def get_noised_result(self, sample_state, global_state): """Gets query result after all records of sample have been accumulated. Args: sample_state: The sample state after all records have been accumulated. global_state: The global state. Returns: A tuple (result, new_global_state) where "result" is a structure matching the query structure containing the results of the subqueries and "new_global_state" is a structure containing the updated global states for the subqueries. """ estimates_and_new_global_states = self._map_to_queries( 'get_noised_result', sample_state, global_state) flat_estimates, flat_new_global_states = zip( *nest.flatten_up_to(self._queries, estimates_and_new_global_states)) return ( nest.pack_sequence_as(self._queries, flat_estimates), nest.pack_sequence_as(self._queries, flat_new_global_states))