rlworkgroup · ManavR123 · Dec 4, 2020 · Dec 4, 2020 · Dec 5, 2020 · ryanjulian
@@ -102,6 +102,8 @@ def __init__(self,
         self.policy = policy
         self._scope = scope
         self.max_episode_length = env_spec.max_episode_length
+        if self.max_episode_length == None:
+            raise ValueError("max_episode_length must not be None")
         self._env_spec = env_spec
         self._baseline = baseline
         self._discount = discount

@@ -115,6 +115,22 @@ def test_npo_with_invalid_no_entropy_configuration(self):
                 entropy_method='no_entropy',
                 policy_ent_coeff=0.02,
             )
+
+    @pytest.mark.mujoco
+    def test_npo_with_invalid_max_episode_length(self):
+        """Test NPO with invalid max_episode_length."""
+        with pytest.raises(ValueError):
+            env = normalize(
+            GymEnv('InvertedDoublePendulum-v2', max_episode_length=None))
+            NPO(
+                env_spec=env.spec,
+                policy=self.policy,
+                baseline=self.baseline,
+                sampler=self.sampler,
+                discount=0.99,
+                gae_lambda=0.98,
+                policy_ent_coeff=0.0
+            )
 
     def teardown_method(self):
         self.env.close()