Henry Peteet 2022-02-07 21:18:16 -05:00 committed by GitHub Enterprise
Parent 1bde547068
Commit 9a5a1418ff
22 changed files with 73 additions and 56 deletions

View file

@ -1,30 +1,32 @@
repos:
- repo: https://github.com/python/black
rev: 19.3b0
rev: 22.1.0
hooks:
- id: black
exclude: >
(?x)^(
.*_pb2.py|
.*_pb2.pyi|
.*_pb2_grpc.py
)$
- repo: https://github.com/pre-commit/mirrors-mypy
rev: v0.761
rev: v0.931
hooks:
- id: mypy
name: mypy-ml-agents
files: "ml-agents/.*"
args: [--ignore-missing-imports, --disallow-incomplete-defs]
args: [--ignore-missing-imports, --disallow-incomplete-defs, --no-strict-optional]
additional_dependencies: [types-PyYAML, types-attrs, types-protobuf, types-setuptools]
- id: mypy
name: mypy-ml-agents-envs
files: "ml-agents-envs/.*"
# Exclude protobuf files and don't follow them when imported
exclude: ".*_pb2.py"
args: [--ignore-missing-imports, --disallow-incomplete-defs]
args: [--ignore-missing-imports, --disallow-incomplete-defs, --no-strict-optional]
additional_dependencies: [types-PyYAML, types-attrs, types-protobuf, types-setuptools]
- repo: https://gitlab.com/pycqa/flake8
rev: 3.8.1
rev: 3.9.2
hooks:
- id: flake8
exclude: >
@ -36,7 +38,7 @@ repos:
additional_dependencies: [flake8-comprehensions==3.2.2, flake8-tidy-imports==4.1.0, flake8-bugbear==20.1.4]
- repo: https://github.com/asottile/pyupgrade
rev: v2.7.0
rev: v2.31.0
hooks:
- id: pyupgrade
args: [--py3-plus, --py36-plus]
@ -47,7 +49,7 @@ repos:
)$
- repo: https://github.com/pre-commit/pre-commit-hooks
rev: v2.5.0
rev: v4.1.0
hooks:
- id: mixed-line-ending
exclude: >
@ -68,12 +70,12 @@ repos:
exclude: \.yamato/.*
- repo: https://github.com/pre-commit/pygrep-hooks
rev: v1.4.2
rev: v1.9.0
hooks:
- id: python-check-mock-methods
- repo: https://github.com/mattlqx/pre-commit-search-and-replace
rev: v1.0.3
rev: v1.0.5
hooks:
- id: search-and-replace
types: [markdown]
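
For anyone applying these bumped hook revisions locally, the standard pre-commit workflow is enough to exercise them; a usage sketch (ordinary pre-commit CLI commands, not part of this commit):

pre-commit install            # (re)register the git hooks
pre-commit run --all-files    # run every updated hook against the whole tree
pre-commit autoupdate         # optionally, let pre-commit propose rev bumps like these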

View file

@ -253,9 +253,15 @@ class UnityPettingzooBaseEnv:
self._current_action[behavior_name] = self._create_empty_actions(
behavior_name, len(current_batch[0])
)
agents, obs, dones, rewards, cumulative_rewards, infos, id_map = _unwrap_batch_steps(
current_batch, behavior_name
)
(
agents,
obs,
dones,
rewards,
cumulative_rewards,
infos,
id_map,
) = _unwrap_batch_steps(current_batch, behavior_name)
self._live_agents += agents
self._agents += agents
self._observations.update(obs)

View file

@ -137,7 +137,7 @@ def download_and_extract_zip(url: str, name: str) -> None:
try:
request = urllib.request.urlopen(url, timeout=30)
except urllib.error.HTTPError as e: # type: ignore
e.msg += " " + url
e.reason = f"{e.reason} {url}"
raise
zip_size = int(request.headers["content-length"])
zip_file_path = os.path.join(zip_dir, str(uuid.uuid4()) + ".zip")
@ -193,7 +193,7 @@ def load_remote_manifest(url: str) -> Dict[str, Any]:
try:
request = urllib.request.urlopen(url, timeout=30)
except urllib.error.HTTPError as e: # type: ignore
e.msg += " " + url
e.reason = f"{e.reason} {url}"
raise
manifest_path = os.path.join(tmp_dir, str(uuid.uuid4()) + ".yaml")
with open(manifest_path, "wb") as manifest:

View file

@ -21,7 +21,7 @@ class SideChannelManager:
try:
channel_id = uuid.UUID(bytes_le=bytes(data[offset : offset + 16]))
offset += 16
message_len, = struct.unpack_from("<i", data, offset)
(message_len,) = struct.unpack_from("<i", data, offset)
offset = offset + 4
message_data = data[offset : offset + message_len]
offset = offset + message_len
@ -63,7 +63,7 @@ class SideChannelManager:
@staticmethod
def _get_side_channels_dict(
side_channels: Optional[List[SideChannel]]
side_channels: Optional[List[SideChannel]],
) -> Dict[uuid.UUID, SideChannel]:
"""
Converts a list of side channels into a dictionary of channel_id to SideChannel
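
Context for the tuple-unpack change above: struct.unpack_from always returns a tuple, even for a single format code, so the one-element target pulls the int out directly; black 22 simply prefers the parenthesized spelling over the bare trailing comma. A minimal sketch:

import struct

buf = struct.pack("<i", 42)                         # four little-endian bytes
(message_len,) = struct.unpack_from("<i", buf, 0)   # unpack_from returns a 1-tuple
assert message_len == 42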

View file

@ -59,5 +59,6 @@ setup(
"numpy==1.21.2",
],
python_requires=">=3.7.2,<3.9.10",
cmdclass={"verify": VerifyVersionCommand},
# TODO: Remove this once mypy stops having spurious setuptools issues.
cmdclass={"verify": VerifyVersionCommand}, # type: ignore
)

View file

@ -42,11 +42,11 @@ class BehaviorIdentifiers(NamedTuple):
def create_name_behavior_id(name: str, team_id: int) -> str:
"""
Reconstructs fully qualified behavior name from name and team_id
:param name: brain name
:param team_id: team ID
:return: name_behavior_id
"""
Reconstructs fully qualified behavior name from name and team_id
:param name: brain name
:param team_id: team ID
:return: name_behavior_id
"""
return name + "?team=" + str(team_id)

View file

@ -264,9 +264,7 @@ class AgentBuffer(MutableMapping):
)
def __str__(self):
return ", ".join(
["'{}' : {}".format(k, str(self[k])) for k in self._fields.keys()]
)
return ", ".join([f"'{k}' : {str(self[k])}" for k in self._fields.keys()])
def reset_agent(self) -> None:
"""

View file

@ -165,7 +165,10 @@ class EnvironmentParameterManager:
):
behavior_to_consider = lesson.completion_criteria.behavior
if behavior_to_consider in trainer_steps:
must_increment, new_smoothing = lesson.completion_criteria.need_increment(
(
must_increment,
new_smoothing,
) = lesson.completion_criteria.need_increment(
float(trainer_steps[behavior_to_consider])
/ float(trainer_max_steps[behavior_to_consider]),
trainer_reward_buffer[behavior_to_consider],

View file

@ -33,7 +33,7 @@ def _dict_to_str(param_dict: Dict[str, Any], num_tabs: int) -> str:
[
"\t"
+ " " * num_tabs
+ "{}:\t{}".format(x, _dict_to_str(param_dict[x], num_tabs + 1))
+ f"{x}:\t{_dict_to_str(param_dict[x], num_tabs + 1)}"
for x in param_dict
]
)

View file

@ -71,7 +71,7 @@ def trainer_controller_with_start_learning_mocks(basic_trainer_controller):
def test_start_learning_trains_forever_if_no_train_model(
trainer_controller_with_start_learning_mocks
trainer_controller_with_start_learning_mocks,
):
tc, trainer_mock = trainer_controller_with_start_learning_mocks
tc.train_model = False
@ -88,7 +88,7 @@ def test_start_learning_trains_forever_if_no_train_model(
def test_start_learning_trains_until_max_steps_then_saves(
trainer_controller_with_start_learning_mocks
trainer_controller_with_start_learning_mocks,
):
tc, trainer_mock = trainer_controller_with_start_learning_mocks
@ -120,7 +120,7 @@ def trainer_controller_with_take_step_mocks(basic_trainer_controller):
def test_advance_adds_experiences_to_trainer_and_trains(
trainer_controller_with_take_step_mocks
trainer_controller_with_take_step_mocks,
):
tc, trainer_mock = trainer_controller_with_take_step_mocks

View file

@ -12,7 +12,7 @@ from mlagents_envs.base_env import ActionSpec
def create_action_model(inp_size, act_size, deterministic=False):
mask = torch.ones([1, act_size ** 2])
mask = torch.ones([1, act_size**2])
action_spec = ActionSpec(act_size, tuple(act_size for _ in range(act_size)))
action_model = ActionModel(inp_size, action_spec, deterministic=deterministic)
return action_model, mask
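
Context for the ** hunks in this and several of the files below: black 22.1.0 removes the spaces around the power operator when both operands are simple (names, numeric literals, attribute access) and keeps them otherwise; a small illustration, assuming that rule:

x = 4
y = x**2          # both operands simple: black hugs the operator
z = (x + 1) ** 2  # compound operand: the spaces stay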

View file

@ -90,7 +90,10 @@ def test_all_masking(mask_value):
# We make sure that a mask of all zeros or all ones will not trigger an error
np.random.seed(1336)
torch.manual_seed(1336)
size, n_k, = 3, 5
size, n_k, = (
3,
5,
)
embedding_size = 64
entity_embeddings = EntityEmbedding(size, n_k, embedding_size)
entity_embeddings.add_self_embedding(size)
@ -134,7 +137,10 @@ def test_all_masking(mask_value):
def test_predict_closest_training():
np.random.seed(1336)
torch.manual_seed(1336)
size, n_k, = 3, 5
size, n_k, = (
3,
5,
)
embedding_size = 64
entity_embeddings = EntityEmbedding(size, n_k, embedding_size)
entity_embeddings.add_self_embedding(size)
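
A side observation on the two hunks above (not something this commit changes): the stray trailing comma in `size, n_k, = 3, 5` appears to be what makes black 22 explode the assignment across four lines; dropping it keeps the one-liner:

size, n_k = 3, 5  # no trailing comma after the targets, so black leaves this on one line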

View file

@ -138,7 +138,7 @@ def test_sample_actions(rnn, visual, discrete):
def test_step_overflow():
policy = create_policy_mock(TrainerSettings())
policy.set_step(2 ** 31 - 1)
assert policy.get_current_step() == 2 ** 31 - 1 # step = 2147483647
policy.set_step(2**31 - 1)
assert policy.get_current_step() == 2**31 - 1 # step = 2147483647
policy.increment_step(3)
assert policy.get_current_step() == 2 ** 31 + 2 # step = 2147483650
assert policy.get_current_step() == 2**31 + 2 # step = 2147483650

View file

@ -39,7 +39,7 @@ def get_zero_entities_mask(entities: List[torch.Tensor]) -> List[torch.Tensor]:
# Generate the masking tensors for each entities tensor (mask only if all zeros)
key_masks: List[torch.Tensor] = [
(torch.sum(ent ** 2, axis=2) < 0.01).float() for ent in entities
(torch.sum(ent**2, axis=2) < 0.01).float() for ent in entities
]
return key_masks
@ -101,11 +101,11 @@ class MultiHeadAttention(torch.nn.Module):
qk = torch.matmul(query, key) # (b, h, n_q, n_k)
if key_mask is None:
qk = qk / (self.embedding_size ** 0.5)
qk = qk / (self.embedding_size**0.5)
else:
key_mask = key_mask.reshape(b, 1, 1, n_k)
qk = (1 - key_mask) * qk / (
self.embedding_size ** 0.5
self.embedding_size**0.5
) + key_mask * self.NEG_INF
att = torch.softmax(qk, dim=3) # (b, h, n_q, n_k)
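
For readers skimming the reformatted hunk above: it is standard scaled dot-product attention, scores = QK^T / sqrt(d), with masked keys pushed toward a large negative value before the softmax. A self-contained sketch where the shapes and the NEG_INF constant are illustrative stand-ins, not the module's actual values:

import torch

NEG_INF = -1e9                          # illustrative stand-in for the class constant
b, h, n_q, n_k, d = 2, 4, 3, 5, 8
query = torch.randn(b, h, n_q, d)
key = torch.randn(b, h, d, n_k)
key_mask = torch.zeros(b, 1, 1, n_k)    # 1.0 would mark a padded (all-zero) entity
qk = torch.matmul(query, key)           # (b, h, n_q, n_k)
qk = (1 - key_mask) * qk / d**0.5 + key_mask * NEG_INF
att = torch.softmax(qk, dim=3)          # each row sums to 1 over the n_k keys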

View file

@ -33,7 +33,9 @@ class BCModule:
self._anneal_steps = settings.steps
self.current_lr = policy_learning_rate * settings.strength
learning_rate_schedule: ScheduleType = ScheduleType.LINEAR if self._anneal_steps > 0 else ScheduleType.CONSTANT
learning_rate_schedule: ScheduleType = (
ScheduleType.LINEAR if self._anneal_steps > 0 else ScheduleType.CONSTANT
)
self.decay_learning_rate = ModelUtils.DecayedValue(
learning_rate_schedule, self.current_lr, 1e-10, self._anneal_steps
)

View file

@ -183,10 +183,10 @@ class DiscriminatorNetwork(torch.nn.Module):
kl_loss = torch.mean(
-torch.sum(
1
+ (self._z_sigma ** 2).log()
- 0.5 * expert_mu ** 2
- 0.5 * policy_mu ** 2
- (self._z_sigma ** 2),
+ (self._z_sigma**2).log()
- 0.5 * expert_mu**2
- 0.5 * policy_mu**2
- (self._z_sigma**2),
dim=1,
)
)
@ -255,6 +255,6 @@ class DiscriminatorNetwork(torch.nn.Module):
estimate = self._estimator(hidden).squeeze(1).sum()
gradient = torch.autograd.grad(estimate, encoder_input, create_graph=True)[0]
# Norm's gradient could be NaN at 0. Use our own safe_norm
safe_norm = (torch.sum(gradient ** 2, dim=1) + self.EPSILON).sqrt()
safe_norm = (torch.sum(gradient**2, dim=1) + self.EPSILON).sqrt()
gradient_mag = torch.mean((safe_norm - 1) ** 2)
return gradient_mag
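
For reference, the kl_loss term reformatted above is the closed-form KL divergence to the standard normal, applied to both encodings: per dimension, KL(N(mu, sigma^2) || N(0, 1)) = 0.5 * (mu^2 + sigma^2 - 1 - log sigma^2), and the inner sum works out to KL(expert) + KL(policy) with a shared sigma. A numeric sketch with illustrative shapes and names:

import torch

mu_expert = torch.randn(16, 4)
mu_policy = torch.randn(16, 4)
sigma = torch.rand(4) + 0.1

def kl_to_standard_normal(mu, sigma):
    # per-sample KL( N(mu, sigma^2) || N(0, 1) ), summed over latent dimensions
    return 0.5 * torch.sum(mu**2 + sigma**2 - 1 - (sigma**2).log(), dim=1)

combined = -torch.sum(
    1 + (sigma**2).log() - 0.5 * mu_expert**2 - 0.5 * mu_policy**2 - sigma**2,
    dim=1,
)
expected = kl_to_standard_normal(mu_expert, sigma) + kl_to_standard_normal(mu_policy, sigma)
assert torch.allclose(combined, expected)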

View file

@ -70,7 +70,7 @@ class GaussianDistInstance(DistInstance):
return self.mean
def log_prob(self, value):
var = self.std ** 2
var = self.std**2
log_scale = torch.log(self.std + EPSILON)
return (
-((value - self.mean) ** 2) / (2 * var + EPSILON)
@ -84,7 +84,7 @@ class GaussianDistInstance(DistInstance):
def entropy(self):
return torch.mean(
0.5 * torch.log(2 * math.pi * math.e * self.std ** 2 + EPSILON),
0.5 * torch.log(2 * math.pi * math.e * self.std**2 + EPSILON),
dim=1,
keepdim=True,
) # Use equivalent behavior to TF
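
As a cross-check on the expressions above (not part of the commit): aside from the EPSILON terms added for numerical stability, the hand-rolled log_prob and entropy agree with torch.distributions.Normal; a minimal sketch:

import math
import torch
from torch.distributions import Normal

mean, std = torch.zeros(3), torch.ones(3) * 0.5
value = torch.tensor([0.5, -1.0, 2.0])
var = std**2

log_prob = -((value - mean) ** 2) / (2 * var) - std.log() - math.log(math.sqrt(2 * math.pi))
entropy = 0.5 * torch.log(2 * math.pi * math.e * std**2)

assert torch.allclose(log_prob, Normal(mean, std).log_prob(value))
assert torch.allclose(entropy, Normal(mean, std).entropy())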

View file

@ -137,7 +137,7 @@ class RLTrainer(Trainer):
return model_saver
def _policy_mean_reward(self) -> Optional[float]:
""" Returns the mean episode reward for the current policy. """
"""Returns the mean episode reward for the current policy."""
rewards = self.cumulative_returns_since_policy_update
if len(rewards) == 0:
return None

View file

@ -89,5 +89,6 @@ setup(
"default=mlagents.plugins.stats_writer:get_default_stats_writers"
],
},
cmdclass={"verify": VerifyVersionCommand},
# TODO: Remove this once mypy stops having spurious setuptools issues.
cmdclass={"verify": VerifyVersionCommand}, # type: ignore
)

View file

@ -47,9 +47,7 @@ def test_run_environment(env_name):
print("Is there a visual observation ?", vis_obs)
# Examine the state space for the first observation for the first agent
print(
"First Agent observation looks like: \n{}".format(decision_steps.obs[0][0])
)
print(f"First Agent observation looks like: \n{decision_steps.obs[0][0]}")
for _episode in range(10):
env.reset()

View file

@ -24,7 +24,7 @@ def get_base_path():
def get_base_output_path():
""""
""" "
Returns the artifact folder to use for yamato jobs.
"""
return os.path.join(get_base_path(), "artifacts")

View file

@ -188,7 +188,7 @@ def check_file(
new_file.write(line)
else:
bad_lines.append(f"{filename}: {line}")
new_line = re.sub(r"release_[0-9]+", fr"{release_tag}", line)
new_line = re.sub(r"release_[0-9]+", rf"{release_tag}", line)
new_line = update_pip_install_line(new_line, package_version)
new_file.write(new_line)
if bad_lines:
@ -235,7 +235,7 @@ def main():
print(f"Python package version: {package_version}")
release_allow_pattern = re.compile(f"{release_tag}(_docs)?")
pip_allow_pattern = re.compile(
fr"python -m pip install (-q )?mlagents(_envs)?=={package_version}"
rf"python -m pip install (-q )?mlagents(_envs)?=={package_version}"
)
bad_lines = check_all_files(
release_allow_pattern, release_tag, pip_allow_pattern, package_version