# coding=utf-8
# Copyright 2020 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
r"""Train behavioral cloning policy for LLVM Inliner decision rule."""

import os

from absl import app
from absl import flags
from absl import logging
import gin

from compiler_opt.rl import agent_creators
from compiler_opt.rl import config
from compiler_opt.rl import constant
from compiler_opt.rl import data_reader
from compiler_opt.rl import gin_external_configurables  # pylint: disable=unused-import
from compiler_opt.rl import policy_saver
from compiler_opt.rl import trainer

flags.DEFINE_string('root_dir', os.getenv('TEST_UNDECLARED_OUTPUTS_DIR'),
                    'Root directory for writing logs/summaries/checkpoints.')
flags.DEFINE_string(
    'data_path', None,
    'Path to TFRecord file(s) containing training data. If None, training is'
    ' skipped and an untrained model with random weights is dumped (for'
    ' testing purposes).')
flags.DEFINE_multi_string('gin_files', [],
                          'List of paths to gin configuration files.')
flags.DEFINE_multi_string(
    'gin_bindings', [],
    'Gin bindings to override the values set in the config files.')

FLAGS = flags.FLAGS


@gin.configurable
def train_eval(agent_name=constant.AgentName.BEHAVIORAL_CLONE,
               problem_type=None,
               num_iterations=100,
               batch_size=64,
               train_sequence_length=1):
"""Train for LLVM inliner."""
root_dir = os.path.expanduser(FLAGS.root_dir)
root_dir = os.path.normpath(root_dir)
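  # Look up the time step/action signature specs and the observation
  # preprocessing layers registered for this problem type.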
  time_step_spec, action_spec = config.get_signature_spec(problem_type)
  preprocessing_layer_creator = config.get_preprocessing_layer_creator(
      problem_type)

  # Initialize trainer and policy saver.
  tf_agent = agent_creators.create_agent(agent_name, time_step_spec,
                                         action_spec,
                                         preprocessing_layer_creator)
  llvm_trainer = trainer.Trainer(root_dir=root_dir, agent=tf_agent)
  policy_dict = {
      'saved_policy': tf_agent.policy,
      'saved_collect_policy': tf_agent.collect_policy,
  }
  saver = policy_saver.PolicySaver(policy_dict=policy_dict)

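  # Build a dataset function that parses serialized trajectories from the
  # TFRecord training logs into batches the agent can train on.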
  tfrecord_dataset_fn = data_reader.create_tfrecord_dataset_fn(
      agent_name=agent_name,
      time_step_spec=time_step_spec,
      action_spec=action_spec,
      batch_size=batch_size,
      train_sequence_length=train_sequence_length)

  # Train.
  if FLAGS.data_path:
    dataset_iter = iter(tfrecord_dataset_fn(FLAGS.data_path).repeat())
    monitor_dict = {}
    llvm_trainer.train(dataset_iter, monitor_dict, num_iterations)

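  # When --data_path is unset, the training block above is skipped and the
  # policy is exported untrained with random weights (see the flag help).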
  # Save final policy.
  saver.save(root_dir)


def main(_):
  gin.parse_config_files_and_bindings(
      FLAGS.gin_files, bindings=FLAGS.gin_bindings, skip_unknown=False)
  logging.info(gin.config_str())

  train_eval()


if __name__ == '__main__':
  app.run(main)