ray-project · sven1977 · Jan 28, 2022 · Jan 20, 2022 · Jan 20, 2022 · Jan 21, 2022
@@ -22,8 +22,6 @@ def test_bandit_lin_ts_compilation(self):
         config = {
             # Use a simple bandit friendly env.
             "env": SimpleContextualBandit,
-            # Run locally.
-            "num_workers": 0,
         }
 
         num_iterations = 5
@@ -38,6 +36,26 @@ def test_bandit_lin_ts_compilation(self):
             # Force good learning behavior (this is a very simple env).
             self.assertTrue(results["episode_reward_mean"] == 10.0)
 
+    def test_bandit_lin_ucb_compilation(self):
+        """Test that BanditLinUCBTrainer builds and learns (torch only)."""
+        config = {
+            # Use a simple bandit friendly env.
+            "env": SimpleContextualBandit,
+        }
+
+        num_iterations = 5
+
+        for _ in framework_iterator(config, frameworks="torch"):
+            trainer = bandit.BanditLinUCBTrainer(config=config)
+            results = None
+            for _ in range(num_iterations):
+                results = trainer.train()
+                check_train_results(results)
+                print(results)
+            trainer.stop()  # Free trainer resources before asserting.
+            # Force good learning behavior (this is a very simple env).
+            self.assertEqual(results["episode_reward_mean"], 10.0)
+
     def test_deprecated_locations(self):
         """Tests, whether importing from old contrib dir fails gracefully.