# Copyright 2020 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Tests for TPU Embeddings mid level API on TPU."""
from absl.testing import parameterized
import numpy as np
from tensorflow.python.compat import v2_compat
from tensorflow.python.distribute import distribute_lib
from tensorflow.python.eager import def_function
from tensorflow.python.framework import config
from tensorflow.python.framework.tensor_shape import TensorShape
from tensorflow.python.ops import array_ops
from tensorflow.python.platform import test
from tensorflow.python.tpu.tests import tpu_embedding_base_test
from tensorflow.python.util import nest


class TPUEmbeddingTest(tpu_embedding_base_test.TPUEmbeddingBaseTest):

  @parameterized.parameters([True, False])
  def test_enqueue_with_outside_compilation(self, use_mlir):
    if use_mlir:
      config.enable_mlir_bridge()
    strategy, mid_level_api, _ = self._create_strategy_and_mid_level('sgd')
    mid_level_api.build([
        TensorShape((self.batch_size, 2)),
        TensorShape((self.batch_size, 2)),
        TensorShape((self.batch_size, 3))
    ])
    dataset = self._create_sparse_dataset(strategy)
    dataset_iter = iter(
        strategy.experimental_distribute_dataset(
            dataset,
            options=distribute_lib.InputOptions(
                experimental_fetch_to_device=False)))
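    # The InputOptions above set experimental_fetch_to_device=False so the
    # distributed dataset yields host-side tensors: the embedding enqueue
    # runs on the host and cannot consume values already placed on the TPU.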

    @def_function.function
    def enqueue_with_outside_compilation(data):

      def get_activations(features):
        mid_level_api.enqueue(features, training=False)
        return mid_level_api.dequeue()

      return strategy.run(get_activations, args=(data,))

    @def_function.function
    def enqueue_without_outside_compilation(data):

      def get_activations():
        return mid_level_api.dequeue()

      mid_level_api.enqueue(data, training=False)
      return strategy.run(get_activations)
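    # Whether the enqueue runs inside the replica function (and is lifted to
    # the host via outside compilation) or is called directly in the
    # tf.function, the dequeued activations should be identical.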
    features = next(dataset_iter)
    activations_oc = enqueue_with_outside_compilation(features)
    activations = enqueue_without_outside_compilation(features)

    # Extract the per-core numpy arrays.
    activations_oc0 = self._get_replica_numpy(activations_oc, strategy, 0)
    activations0 = self._get_replica_numpy(activations, strategy, 0)
    self.assertAllClose(activations_oc0, activations0)

  @parameterized.parameters(True, False)
  def test_enqueue_with_outside_compilation_in_control_flow(self, use_mlir):
    self.skip_if_oss()
    if use_mlir:
      config.enable_mlir_bridge()
    strategy, mid_level_api, _ = self._create_strategy_and_mid_level('sgd')
    dataset = self._create_sparse_dataset(strategy)
    dataset_iter = iter(
        strategy.experimental_distribute_dataset(
            dataset,
            options=distribute_lib.InputOptions(
                experimental_fetch_to_device=False)))

    # This is one way to force the enqueue into some control flow:
    # tf.functions are not inlined into the calling tf.function, so the
    # enqueue ends up in a different graph. An alternative would be to place
    # the enqueue in a switch_v2 or something similar.
    @def_function.function
    def enqueue_fn(features):
      mid_level_api.enqueue(features, training=False)

    @def_function.function
    def enqueue_with_outside_compilation():

      def get_activations(features):
        enqueue_fn(features)
        return mid_level_api.dequeue()

      return strategy.run(get_activations, args=(next(dataset_iter),))

    with self.assertRaisesRegex(
        RuntimeError,
        'does not match graph which contains TPUReplicateContext'):
      enqueue_with_outside_compilation()

  def test_enqueue_with_outside_compilation_non_direct_input(self):
    strategy, mid_level_api, _ = self._create_strategy_and_mid_level('sgd')
    mid_level_api.build([
        TensorShape((self.batch_size, 2)),
        TensorShape((self.batch_size, 2)),
        TensorShape((self.batch_size, 3))
    ])
    dataset = self._create_sparse_dataset(strategy)
    dataset_iter = iter(
        strategy.experimental_distribute_dataset(
            dataset,
            options=distribute_lib.InputOptions(
                experimental_fetch_to_device=False)))
    @def_function.function
    def enqueue_with_outside_compilation():

      def get_activations(features):
        # The multiply below runs on the TPU, so the tensors passed to
        # enqueue are no longer direct outputs of the dataset iterator. This
        # triggers the direct input error asserted on below.
        features = (features[0] * 2, features[1] * 2, features[2] * 2)
        mid_level_api.enqueue(features, training=False)
        return mid_level_api.dequeue()

      return strategy.run(get_activations, args=(next(dataset_iter),))

    with self.assertRaisesRegex(
        ValueError, 'which does not have the `_tpu_input_identity` attr'):
      enqueue_with_outside_compilation()

  def test_enqueue_with_outside_compilation_auto_mode(self):
    strategy, mid_level_api, _ = self._create_strategy_and_mid_level('sgd')
    mid_level_api.build([
        TensorShape((self.batch_size, 2)),
        TensorShape((self.batch_size, 2)),
        TensorShape((self.batch_size, 3))
    ])
    dataset = self._create_sparse_dataset(strategy)
    dataset_iter = iter(
        strategy.experimental_distribute_dataset(
            dataset,
            options=distribute_lib.InputOptions(
                experimental_fetch_to_device=False)))
    @def_function.function
    def enqueue_with_no_gradient_apply(data):

      def get_activations(features):
        # Note that training=False is not set here, so training defaults to
        # True even though we never call apply_gradients. The correct mode is
        # detected based on which ops exist that share the same 'name'.
        mid_level_api.enqueue(features, name='call1')
        return mid_level_api.dequeue(name='call1')

      return strategy.run(get_activations, args=(data,))

    @def_function.function
    def enqueue_with_gradient_apply(data):

      def get_activations(features):
        mid_level_api.enqueue(features, name='call2')
        activations = mid_level_api.dequeue(name='call2')
        # Apply an all-ones gradient.
        gradients = nest.map_structure(array_ops.ones_like, activations)
        mid_level_api.apply_gradients(gradients, name='call2')
        return activations

      return strategy.run(get_activations, args=(data,))

    data = next(dataset_iter)
    before_gradient_apply = enqueue_with_gradient_apply(data)
    after_gradient_apply = enqueue_with_no_gradient_apply(data)
    before_gradient_apply0 = self._get_replica_numpy(
        before_gradient_apply, strategy, 0)
    after_gradient_apply0 = self._get_replica_numpy(
        after_gradient_apply, strategy, 0)
    num_replicas = strategy.num_replicas_in_sync
    # We are passing a gradient of 1 for all lookups and the optimizer is SGD
    # with a learning rate of 0.1. Features 0 and 1 are looked up with a sum
    # combiner with the following ids:
    #   Feature 0: [0, 0, 1], [0, 1, 1], ... repeated over num_replicas
    #   Feature 1: [0, 1, 1], [0, 0, 1], ... repeated over num_replicas
    # i.e. rows 0 and 1 are looked up 3*num_replicas times in total across
    # all cores, and since the gradient is 1, the accumulated gradient is
    # 3*num_replicas for each position in rows 0 and 1 of the table.
    #
    # See comments in test_pass_none_to_apply_gradients for the update to
    # Feature 2 and its table.
    #
    # The *2 factors below are there because those rows have 2 lookups vs
    # the 1 lookup in the other row.
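    #
    # A concrete instance of the arithmetic above (a sketch, not an extra
    # assertion): each position of rows 0 and 1 moves by
    # learning_rate * accumulated_gradient = 0.1 * 3 * num_replicas
    # = 0.3 * num_replicas, which is exactly the 0.3 * num_replicas entries
    # below, doubled where a feature looks a row up twice per example.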
    update = ([[0.3 * num_replicas], [0.3 * num_replicas * 2]],
              [[0.3 * num_replicas * 2], [0.3 * num_replicas]],
              [[0.1 * num_replicas], [0.1 / 3 * num_replicas]])
    golden = tuple([
        before - np.array(up)
        for before, up in zip(before_gradient_apply0, update)
    ])
    self.assertAllClose(golden, after_gradient_apply0)


if __name__ == '__main__':
  v2_compat.enable_v2_behavior()
  test.main()