Changed the `init_final` value to center the policy's starting mean and standard deviation

Co-authored-by: Adil Zouitine <adilzouitinegm@gmail.com>
2025-02-13 16:42:43 +01:00
parent 0c32008466
commit d9a70376d8
4 changed files with 5 additions and 4 deletions
--- a/lerobot/common/policies/hilserl/classifier/modeling_classifier.py
+++ b/lerobot/common/policies/hilserl/classifier/modeling_classifier.py
@@ -148,7 +148,7 @@ class Classifier(
    def predict_reward(self, x, threshold=0.6):
        if self.config.num_classes == 2:
            probs = self.forward(x).probabilities
-            logging.info(f"Predicted reward images: {probs}")
+            logging.debug(f"Predicted reward images: {probs}")
            return (probs > threshold).float()
        else:
            return torch.argmax(self.forward(x).probabilities, dim=1)