ray-project · sven1977 · Aug 22, 2022 · Aug 18, 2022 · Aug 18, 2022 · Aug 18, 2022
@@ -148,8 +148,10 @@ def reduce_mean_valid(t):
             mean_vf_loss = reduce_mean_valid(vf_loss_clipped)
         # Ignore the value function.
         else:
-            value_fn_out = 0
-            vf_loss_clipped = mean_vf_loss = 0.0
+            value_fn_out = torch.tensor(0.0).to(mean_policy_loss.device)
+            vf_loss_clipped = mean_vf_loss = torch.tensor(0.0).to(
+                mean_policy_loss.device
+            )
 
         total_loss = reduce_mean_valid(
             -surrogate_loss

@@ -211,6 +211,9 @@ def explained_variance(y: TensorType, pred: TensorType) -> TensorType:
         The explained variance given a pair of labels and predictions.
     """
     y_var = torch.var(y, dim=[0])
+    if y_var == 0.0:
+        # Model case in which y does not vary with explained variance of -1
+        return torch.tensor(-1.0).to(pred.device)
     diff_var = torch.var(y - pred, dim=[0])
     min_ = torch.tensor([-1.0]).to(pred.device)
     return torch.max(min_, 1 - (diff_var / y_var))[0]