utility class for processing and recording best trajectories. (#152)

yundiqian · web-flow · commit 3ba3ebf215c1 · 2022-09-26T12:13:58.000-07:00
* best trajectories

* pytype

* pytype

* pylint
diff --git a/compiler_opt/rl/best_trajectory.py b/compiler_opt/rl/best_trajectory.py
@@ -0,0 +1,101 @@
+# coding=utf-8
+# Copyright 2020 Google LLC
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""Module for storing and processing best trajectories."""
+
+import dataclasses
+import json
+from typing import Dict, List
+
+import tensorflow as tf
+
+from compiler_opt.rl import constant
+
+
+@dataclasses.dataclass(frozen=True)
+class BestTrajectory:  # immutable record of one trajectory's outcome.
+  reward: float  # BestTrajectoryRepo keeps the entry with the lower reward.
+  action_list: List[int]  # one int per step of the trajectory, in order.
+
+
+class BestTrajectoryRepo:
+  """Class for storing and processing best trajectory related operations."""
+
+  def __init__(self, action_name: str):
+    """Constructor.
+
+    Args:
+      action_name: action name of the trajectory, used for extracting action
+        list from tensorflow.SequenceExample.
+    """
+    # {module_name: {identifier: best trajectory}}
+    self._best_trajectories: Dict[str, Dict[str, BestTrajectory]] = {}
+    self._action_name: str = action_name
+
+  @property
+  def best_trajectories(self) -> Dict[str, Dict[str, BestTrajectory]]:
+    """Returns a shallow copy of {module_name: {identifier: trajectory}}."""
+    return self._best_trajectories.copy()
+
+  def sink_to_json_file(self, path: str):
+    """Writes every stored trajectory to `path` as a single JSON document."""
+    with tf.io.gfile.GFile(path, 'w') as f:
+      json.dump(self._best_trajectories, f, cls=constant.DataClassJSONEncoder)
+
+  def load_from_json_file(self, path: str):
+    """Loads trajectories from `path`; modules with no entries are skipped."""
+    with tf.io.gfile.GFile(path, 'r') as f:
+      data = json.load(f)
+    for k, v in data.items():
+      if v:
+        self._best_trajectories[k] = {
+            sub_k: BestTrajectory(**sub_v) for sub_k, sub_v in v.items()
+        }
+
+  def sink_to_csv_file(self, path: str):
+    """Sink to csv file format consumable by compiler."""
+    with tf.io.gfile.GFile(path, 'w') as f:
+      for k, v in self._best_trajectories.items():
+        for sub_k, sub_v in v.items():
+          f.write(','.join([k, sub_k] + [str(x) for x in sub_v.action_list]) +
+                  '\n')
+
+  def combine_with_other_repo(self, other: 'BestTrajectoryRepo'):
+    """Merge `other` into this repo, keeping the lower-reward trajectory."""
+    for k, v in other.best_trajectories.items():
+      # setdefault gives us our own inner dict, never an alias of other's.
+      mine = self._best_trajectories.setdefault(k, {})
+      for sub_k, sub_v in v.items():
+        # An identifier we have never seen is adopted unconditionally.
+        if sub_k not in mine or sub_v.reward < mine[sub_k].reward:
+          mine[sub_k] = sub_v
+
+  def update_if_better_trajectory(self, module_name: str, identifier: str,
+                                  reward: float, trajectory: bytes):
+    """Update with incoming trajectory if the reward is lower.
+
+    Args:
+      module_name: module name of the trajectory.
+      identifier: identifier of the trajectory within module.
+      reward: reward of the trajectory.
+      trajectory: trajectory in the format of serialized SequenceExample.
+    """
+    module = self._best_trajectories.setdefault(module_name, {})
+    if identifier not in module or module[identifier].reward > reward:
+      example = tf.train.SequenceExample.FromString(trajectory)
+      steps = example.feature_lists.feature_list[self._action_name].feature
+      # Each step contributes only the first value of its int64 list.
+      action_list = [x.int64_list.value[0] for x in steps]
+      module[identifier] = BestTrajectory(
+          reward=reward, action_list=action_list)
diff --git a/compiler_opt/rl/best_trajectory_test.py b/compiler_opt/rl/best_trajectory_test.py
@@ -0,0 +1,134 @@
+# coding=utf-8
+# Copyright 2020 Google LLC
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+"""Tests for compiler_opt.rl.best_trajectory."""
+
+from absl.testing import absltest
+from absl.testing import parameterized
+
+import tensorflow as tf
+
+from compiler_opt.rl import best_trajectory
+
+_ACTION_NAME = 'mock'  # feature-list key used by all fixtures and tests.
+
+
+def _get_test_repo_1():
+  """Returns a repo whose module_1 holds two three-action trajectories."""
+  trajectory = best_trajectory.BestTrajectory
+  fixture = best_trajectory.BestTrajectoryRepo(action_name=_ACTION_NAME)
+  # pylint: disable=protected-access
+  fixture._best_trajectories['module_1'] = {
+      'function_1': trajectory(reward=3.4, action_list=[1, 3, 5]),
+      'function_2': trajectory(reward=1.2, action_list=[9, 7, 5]),
+  }
+  # pylint: enable=protected-access
+  return fixture
+
+
+def _get_test_repo_2():
+  """Returns a repo with two-action module_1 entries plus a module_2 entry."""
+  trajectory = best_trajectory.BestTrajectory
+  fixture = best_trajectory.BestTrajectoryRepo(action_name=_ACTION_NAME)
+  # pylint: disable=protected-access
+  # function_1 beats repo_1's reward (2.3 < 3.4); function_2 does not.
+  fixture._best_trajectories['module_1'] = {
+      'function_1': trajectory(reward=2.3, action_list=[1, 3]),
+      'function_2': trajectory(reward=3.4, action_list=[9, 7]),
+  }
+  fixture._best_trajectories['module_2'] = {
+      'function_1': trajectory(reward=7.8, action_list=[2, 4, 6]),
+  }
+  # pylint: enable=protected-access
+  return fixture
+
+
+def _get_combined_repo():
+  """Returns the expected merge of repo_1 and repo_2 (lowest reward wins)."""
+  trajectory = best_trajectory.BestTrajectory
+  fixture = best_trajectory.BestTrajectoryRepo(action_name=_ACTION_NAME)
+  # pylint: disable=protected-access
+  # function_1 comes from repo_2, function_2 from repo_1.
+  fixture._best_trajectories['module_1'] = {
+      'function_1': trajectory(reward=2.3, action_list=[1, 3]),
+      'function_2': trajectory(reward=1.2, action_list=[9, 7, 5]),
+  }
+  fixture._best_trajectories['module_2'] = {
+      'function_1': trajectory(reward=7.8, action_list=[2, 4, 6]),
+  }
+  # pylint: enable=protected-access
+  return fixture
+
+
+def _create_sequence_example(action_list):
+  example = tf.train.SequenceExample()
+  for action in action_list:  # one single-valued int64 feature per action.
+    example.feature_lists.feature_list[_ACTION_NAME].feature.add(
+    ).int64_list.value.append(action)
+  return example.SerializeToString()  # bytes, as the repo's updater expects.
+
+
+class BestTrajectoryTest(parameterized.TestCase):
+  """Covers JSON/CSV sinks, repo merging and single-trajectory updates."""
+
+  @parameterized.named_parameters(('repo_1', _get_test_repo_1()),
+                                  ('repo_2', _get_test_repo_2()))
+  def test_sink_load_json_file(self, repo):
+    """A repo written to JSON and read back compares equal to the original."""
+    json_path = self.create_tempfile().full_path
+    repo.sink_to_json_file(json_path)
+    restored = best_trajectory.BestTrajectoryRepo(action_name=_ACTION_NAME)
+    restored.load_from_json_file(json_path)
+    self.assertDictEqual(repo.best_trajectories, restored.best_trajectories)
+
+  def test_sink_to_csv_file(self):
+    """Each CSV row is module, identifier, then the actions in order."""
+    csv_path = self.create_tempfile().full_path
+    repo = _get_test_repo_1()
+    repo.sink_to_csv_file(csv_path)
+    with open(csv_path, 'r', encoding='utf-8') as f:
+      written = f.read()
+    # Rows follow dict insertion order: function_1 before function_2.
+    expected = 'module_1,function_1,1,3,5\nmodule_1,function_2,9,7,5\n'
+    self.assertEqual(written, expected)
+
+  # Each case gets its own pair of repos: the fixture builders run once per
+  # argument while the decorator below is evaluated.
+  @parameterized.named_parameters(
+      ('repo_1_combine_2', _get_test_repo_1(), _get_test_repo_2()),
+      ('repo_2_combine_1', _get_test_repo_2(), _get_test_repo_1()))
+  def test_combine_with_other_repo(self, base_repo, second_repo):
+    """Merging in either direction yields the same per-function minimum."""
+    base_repo.combine_with_other_repo(second_repo)
+    merged = base_repo.best_trajectories
+    self.assertDictEqual(merged, _get_combined_repo().best_trajectories)
+
+  def test_update_if_better_trajectory(self):
+    """Lower rewards replace, higher are ignored, new modules are added."""
+    repo = _get_test_repo_1()
+    candidates = (
+        ('module_1', 'function_1', 2.3, [1, 3]),  # 2.3 < 3.4: replaces.
+        ('module_1', 'function_2', 3.4, [9, 7]),  # 3.4 > 1.2: ignored.
+        ('module_2', 'function_1', 7.8, [2, 4, 6]),  # unseen module: added.
+    )
+    for module_name, identifier, reward, actions in candidates:
+      repo.update_if_better_trajectory(
+          module_name, identifier, reward,
+          _create_sequence_example(action_list=actions))
+    self.assertDictEqual(repo.best_trajectories,
+                         _get_combined_repo().best_trajectories)
+
+
+if __name__ == '__main__':  # only when this file is executed as a script.
+  absltest.main()