# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
"""Tests for custom training loops."""
from absl.testing import parameterized
from tensorflow.python import tf2
from tensorflow.python.data.ops import dataset_ops
from tensorflow.python.distribute import combinations
from tensorflow.python.distribute import strategy_combinations
from tensorflow.python.eager import backprop
from tensorflow.python.eager import def_function
from tensorflow.python.eager import test
from tensorflow.python.ops import math_ops
from tensorflow.python.ops import variables


def get_dataset_from_tensor_slices(inp_array):
  dataset = dataset_ops.DatasetV2.from_tensor_slices(inp_array)
  # TODO(b/138326910): Remove Dataset V1 version once bug resolved.
  if not tf2.enabled():
    dataset = dataset_ops.Dataset.from_tensor_slices(inp_array)
  return dataset
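
# For reference: the tests below call
# get_dataset_from_tensor_slices([5., 6., 7., 8.]).batch(2), which yields two
# batches, [5., 6.] and [7., 8.].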


class AssertFlattenedMixin(object):
  """Mixin for specialized asserts."""

  def assert_equal_flattened(self, expected_results, actual_results):
    """Asserts that flattened results are equal.

    Due to the number of replicas in the strategy, the output may have a
    different structure and needs to be flattened for comparison.

    Args:
      expected_results: The results expected as a result of a computation.
      actual_results: The actual results of a computation.
    """
    self.assertEqual(len(expected_results), len(actual_results))
    for i, expected_result in enumerate(expected_results):
      final_result = []
      actual_result = actual_results[i]
      for val in actual_result:
        final_result.extend(val.numpy())
      self.assertAllEqual(expected_result, final_result)
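

# Sketch of the structure assert_equal_flattened handles (assuming a
# hypothetical two-replica strategy): each step returns one tensor per
# replica, so two batches of results arrive as
#   [[replica0_t0, replica1_t0], [replica0_t1, replica1_t1]]
# and are compared against flat per-batch lists such as
# [[10., 12.], [14., 16.]].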


class GradientTapeTest(test.TestCase, parameterized.TestCase,
                       AssertFlattenedMixin):

  @combinations.generate(
      combinations.combine(
          distribution=strategy_combinations.all_strategies,
          mode=["eager"]))
  def testStepInFunctionGradient(self, distribution):
    dataset = get_dataset_from_tensor_slices([5., 6., 7., 8.]).batch(2)

    @def_function.function
    def train_step(x):

      def computation(x):
        return math_ops.square(x)

      with backprop.GradientTape() as tape:
        tape.watch(x)  # Manually watch non-variable tensors.
        y = computation(x)
        grads = tape.gradient(y, x)
      return grads

    dist_dataset = distribution.experimental_distribute_dataset(dataset)
    results = []
    for x in dist_dataset:
      output = distribution.experimental_local_results(
          distribution.run(train_step, args=(x,)))
      results.append(output)
    self.assert_equal_flattened([[10., 12.], [14., 16.]], results)
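    # Sanity check on the expected values above: train_step computes
    # y = x**2, so tape.gradient returns dy/dx = 2 * x, and the inputs
    # [5., 6.] and [7., 8.] give gradients [10., 12.] and [14., 16.].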

  @combinations.generate(
      combinations.combine(
          distribution=strategy_combinations.all_strategies,
          mode=["eager"]))
  def testRunInFunctionGradient(self, distribution):
    dataset = get_dataset_from_tensor_slices([5., 6., 7., 8.]).batch(2)

    @def_function.function
    def run(x):

      def train_step(x):

        def computation(x):
          return math_ops.square(x)

        with backprop.GradientTape() as tape:
          tape.watch(x)  # Manually watch non-variable tensors.
          y = computation(x)
          grads = tape.gradient(y, x)
        return grads

      return distribution.experimental_local_results(
          distribution.run(train_step, args=(x,)))

    dist_dataset = distribution.experimental_distribute_dataset(dataset)
    results = []
    for x in dist_dataset:
      output = run(x)
      results.append(output)
    self.assert_equal_flattened([[10., 12.], [14., 16.]], results)
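    # Same math as testStepInFunctionGradient; the difference is that here
    # the tf.function wraps the strategy.run call itself rather than only
    # the per-replica train_step.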

  @combinations.generate(
      combinations.combine(
          distribution=strategy_combinations.all_strategies,
          mode=["eager"],
          model_in_tf_function=[True, False]))
  def testNestedFunction(self, distribution, model_in_tf_function):

    def model(x):
      return x * x

    if model_in_tf_function:
      model = def_function.function(model)

    with distribution.scope():
      x = variables.Variable(1.0)

      @def_function.function
      def train_step():

        def replica_step():
          with backprop.GradientTape() as tape:
            y = model(x)
          return tape.gradient(y, x)

        return distribution.run(replica_step)

      grads = distribution.experimental_local_results(train_step())
      self.assertLen(grads, distribution.num_replicas_in_sync)
      self.assertTrue(all(g is not None for g in grads))
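      # Note: replica_step differentiates y = x * x at x = 1.0, so each
      # replica's gradient is 2.0; the assertions above only check that one
      # non-None gradient is produced per replica, with model either inside
      # or outside a tf.function.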
if __name__ == "__main__":
test.main()