Merge pull request #612 from ChrisCummins/fix/reward-name-compat

ChrisCummins · web-flow · commit 67ed37a2f9ea · 2022-03-07T22:03:16.000Z
Add backwards compatibility for Reward.id.
diff --git a/compiler_gym/spaces/reward.py b/compiler_gym/spaces/reward.py
@@ -2,6 +2,7 @@
 #
 # This source code is licensed under the MIT license found in the
 # LICENSE file in the root directory of this source tree.
+import warnings
 from typing import List, Optional, Tuple, Union
 
 import numpy as np
@@ -38,7 +39,10 @@ class Reward(Scalar):
 
     def __init__(
         self,
-        name: str,
+        # NOTE(github.com/facebookresearch/CompilerGym/issues/381): Once `id`
+        # argument has been removed, the default value for `name` can be
+        # removed.
+        name: str = None,
         observation_spaces: Optional[List[str]] = None,
         default_value: RewardType = 0,
         min: Optional[RewardType] = None,
@@ -47,6 +51,10 @@ def __init__(
         success_threshold: Optional[RewardType] = None,
         deterministic: bool = False,
         platform_dependent: bool = True,
+        # NOTE(github.com/facebookresearch/CompilerGym/issues/381): Backwards
+        # compatability workaround for deprecated parameter, will be removed in
+        # v0.2.4.
+        id: Optional[str] = None,
     ):
         """Constructor.
 
@@ -56,33 +64,53 @@ def __init__(
             (:class:`space.id <compiler_gym.views.ObservationSpaceSpec>` values)
             that are used to compute the reward. May be an empty list if no
             observations are requested. Requested observations will be provided
-            to the :code:`observations` argument of
-            :meth:`reward.update() <compiler_gym.spaces.Reward.update>`.
+            to the :code:`observations` argument of :meth:`reward.update()
+            <compiler_gym.spaces.Reward.update>`.
         :param default_value: A default reward. This value will be returned by
-            :meth:`env.step() <compiler_gym.envs.CompilerEnv.step>` if
-            the service terminates.
+            :meth:`env.step() <compiler_gym.envs.CompilerEnv.step>` if the
+            service terminates.
         :param min: The lower bound of the reward.
         :param max: The upper bound of the reward.
         :param default_negates_returns: If true, the default value will be
             offset by the sum of all rewards for the current episode. For
             example, given a default reward value of *-10.0* and an episode with
-            prior rewards *[0.1, 0.3, -0.15]*, the default value is:
-            *-10.0 - sum(0.1, 0.3, -0.15)*.
+            prior rewards *[0.1, 0.3, -0.15]*, the default value is: *-10.0 -
+            sum(0.1, 0.3, -0.15)*.
         :param success_threshold: The cumulative reward threshold before an
             episode is considered successful. For example, episodes where reward
             is scaled to an existing heuristic can be considered “successful”
             when the reward exceeds the existing heuristic.
         :param deterministic: Whether the reward space is deterministic.
         :param platform_dependent: Whether the reward values depend on the
             execution environment of the service.
+        :param id: The name of the reward space.
+
+            .. deprecated:: 0.2.3
+                Use :code:`name` instead.
         """
         super().__init__(
             name=name,
             min=-np.inf if min is None else min,
             max=np.inf if max is None else max,
             dtype=np.float64,
         )
-        self.name = name
+
+        # NOTE(github.com/facebookresearch/CompilerGym/issues/381): Backwards
+        # compatability workaround for deprecated parameter, will be removed in
+        # v0.2.4.
+        if id is not None:
+            warnings.warn(
+                "The `id` argument of "
+                "compiler_gym.spaces.Reward.__init__() "
+                "has been renamed `name`. This will break in a future release, "
+                "please update your code.",
+                DeprecationWarning,
+            )
+        self.name = name or id
+        self.id = self.name
+        if not self.name:
+            raise TypeError("No name given")
+
         self.observation_spaces = observation_spaces or []
         self.default_value: RewardType = default_value
         self.default_negates_returns: bool = default_negates_returns
diff --git a/tests/spaces/BUILD b/tests/spaces/BUILD
@@ -24,6 +24,16 @@ py_test(
     ],
 )
 
+py_test(
+    name = "reward_test",
+    timeout = "short",
+    srcs = ["reward_test.py"],
+    deps = [
+        "//compiler_gym/spaces",
+        "//tests:test_main",
+    ],
+)
+
 py_test(
     name = "scalar_test",
     timeout = "short",
diff --git a/tests/spaces/CMakeLists.txt b/tests/spaces/CMakeLists.txt
@@ -25,6 +25,16 @@ cg_py_test(
     tests::test_main
 )
 
+cg_py_test(
+  NAME
+    reward_test
+  SRCS
+    "reward_test.py"
+  DEPS
+    compiler_gym::spaces::spaces
+    tests::test_main
+)
+
 cg_py_test(
   NAME
     scalar_test
diff --git a/tests/spaces/reward_test.py b/tests/spaces/reward_test.py
@@ -0,0 +1,25 @@
+# Copyright (c) Facebook, Inc. and its affiliates.
+#
+# This source code is licensed under the MIT license found in the
+# LICENSE file in the root directory of this source tree.
+"""Unit tests for compiler_gym.spaces.Reward."""
+import pytest
+
+from compiler_gym.spaces import Reward
+from tests.test_main import main
+
+
+def test_reward_id_backwards_compatibility():
+    """Test that Reward.id is backwards compatible with Reward.name.
+
+    See: github.com/facebookresearch/CompilerGym/issues/381
+    """
+    with pytest.warns(DeprecationWarning, match="renamed `name`"):
+        reward = Reward(id="foo")
+
+    assert reward.id == "foo"
+    assert reward.name == "foo"
+
+
+if __name__ == "__main__":
+    main()