We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 78f31e8 commit 4fa5618 Copy full SHA for 4fa5618
sota-implementations/cql/utils.py
@@ -18,8 +18,7 @@
18
TensorDictPrioritizedReplayBuffer,
19
TensorDictReplayBuffer,
20
)
21
-from torchrl.data.datasets.d4rl import D4RLExperienceReplay
22
-from torchrl.data.datasets.minari_data import MinariExperienceReplay
+from torchrl.data.datasets.minari_data import MinariExperienceReplay
23
from torchrl.data.replay_buffers import SamplerWithoutReplacement
24
from torchrl.envs import (
25
CatTensors,
torchrl/envs/llm/transforms/reason.py
@@ -153,7 +153,6 @@ def _step(
153
Returns:
154
The modified next_tensordict
155
"""
156
- print("Reward", next_tensordict["reward"])
157
# Handle batch dimensions
158
if next_tensordict.batch_dims >= 1:
159
ntds = []
0 commit comments