Skip to content

Commit 8604b4b

Browse files
svekars and vmoens authored
Cherry-pick: Fix torchrl scripts for PT 2.6 TorchRL>=0.6 (#3199) (#3266)
Fixes #3195. Fixing TorchRL scripts for the PyTorch 2.6 release. Co-authored-by: Vincent Moens <vmoens@meta.com>
1 parent 8f0518c commit 8604b4b

File tree

5 files changed

+5
-6
lines changed

5 files changed

+5
-6
lines changed

.jenkins/validate_tutorials_built.py

-1
Original file line number | Diff line number | Diff line change
@@ -51,7 +51,6 @@
5151
"intermediate_source/text_to_speech_with_torchaudio",
5252
"intermediate_source/tensorboard_profiler_tutorial", # reenable after 2.0 release.
5353
"intermediate_source/torch_export_tutorial", # reenable after 2940 is fixed.
54-
"advanced_source/pendulum",
5554
]
5655

5756
def tutorial_source_dirs() -> List[Path]:

advanced_source/coding_ddpg.py

+1 -1
Original file line number | Diff line number | Diff line change
@@ -893,7 +893,7 @@ def make_recorder(actor_model_explore, transform_state_dict, record_interval):
893893
record_frames=1000,
894894
policy_exploration=actor_model_explore,
895895
environment=environment,
896-
exploration_type=ExplorationType.MEAN,
896+
exploration_type=ExplorationType.DETERMINISTIC,
897897
record_interval=record_interval,
898898
)
899899
return recorder_obj

advanced_source/pendulum.py

+1 -1
Original file line number | Diff line number | Diff line change
@@ -604,7 +604,7 @@ def __init__(self, td_params=None, seed=None, device="cpu"):
604604
env,
605605
# ``Unsqueeze`` the observations that we will concatenate
606606
UnsqueezeTransform(
607-
unsqueeze_dim=-1,
607+
dim=-1,
608608
in_keys=["th", "thdot"],
609609
in_keys_inv=["th", "thdot"],
610610
),

intermediate_source/dqn_with_rnn_tutorial.py

+1 -1
Original file line number | Diff line number | Diff line change
@@ -433,7 +433,7 @@
433433
exploration_module.step(data.numel())
434434
updater.step()
435435

436-
with set_exploration_type(ExplorationType.MODE), torch.no_grad():
436+
with set_exploration_type(ExplorationType.DETERMINISTIC), torch.no_grad():
437437
rollout = env.rollout(10000, stoch_policy)
438438
traj_lens.append(rollout.get(("next", "step_count")).max().item())
439439

intermediate_source/reinforcement_ppo.py

+2 -2
Original file line number | Diff line number | Diff line change
@@ -419,8 +419,8 @@
419419
in_keys=["loc", "scale"],
420420
distribution_class=TanhNormal,
421421
distribution_kwargs={
422-
"min": env.action_spec.space.low,
423-
"max": env.action_spec.space.high,
422+
"low": env.action_spec.space.low,
423+
"high": env.action_spec.space.high,
424424
},
425425
return_log_prob=True,
426426
# we'll need the log-prob for the numerator of the importance weights

0 commit comments

Comments (0)