Skip to content

Commit 5a41933

Browse files
authored
update notebook (#39)
1 parent 626f0b8 commit 5a41933

1 file changed

Lines changed: 6 additions & 15 deletions

File tree

train.ipynb

Lines changed: 6 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -43,7 +43,7 @@
4343
"source": [
4444
"# Install packages\n",
4545
"\n",
46-
"!pip install ksim==0.1.0 xax==0.3.0 mujoco-scenes"
46+
"!pip install ksim==0.1.2 xax==0.3.0 mujoco-scenes"
4747
]
4848
},
4949
{
@@ -474,10 +474,6 @@
474474
" value=True,\n",
475475
" help=\"Whether to use the IMU acceleration and gyroscope observations.\",\n",
476476
" )\n",
477-
" use_domain_randomization: bool = xax.field(\n",
478-
" value=True,\n",
479-
" help=\"Whether to use domain randomization.\",\n",
480-
" )\n",
481477
"\n",
482478
" # Curriculum parameters.\n",
483479
" num_curriculum_levels: int = xax.field(\n",
@@ -628,22 +624,20 @@
628624
" def get_rewards(self, physics_model: ksim.PhysicsModel) -> list[ksim.Reward]:\n",
629625
" return [\n",
630626
" # Standard rewards.\n",
631-
" ksim.NaiveForwardReward(clip_max=2.0, in_robot_frame=False, scale=3.0),\n",
627+
" ksim.NaiveForwardReward(clip_max=1.25, in_robot_frame=False, scale=3.0),\n",
632628
" ksim.NaiveForwardOrientationReward(scale=1.0),\n",
633629
" ksim.StayAliveReward(scale=1.0),\n",
634630
" ksim.UprightReward(scale=0.5),\n",
635631
" # Avoid movement penalties.\n",
636-
" ksim.AngularVelocityPenalty(index=(\"x\", \"y\"), scale=-0.005),\n",
637-
" ksim.LinearVelocityPenalty(index=(\"z\"), scale=-0.005),\n",
632+
" ksim.AngularVelocityPenalty(index=(\"x\", \"y\"), scale=-0.1),\n",
633+
" ksim.LinearVelocityPenalty(index=(\"z\"), scale=-0.1),\n",
638634
" # Normalization penalties.\n",
639635
" ksim.AvoidLimitsPenalty.create(physics_model, scale=-0.01),\n",
640-
" ksim.JointVelocityPenalty(scale=-0.01, scale_by_curriculum=True),\n",
641636
" ksim.JointAccelerationPenalty(scale=-0.01, scale_by_curriculum=True),\n",
642637
" ksim.JointJerkPenalty(scale=-0.01, scale_by_curriculum=True),\n",
643638
" ksim.LinkAccelerationPenalty(scale=-0.01, scale_by_curriculum=True),\n",
644639
" ksim.LinkJerkPenalty(scale=-0.01, scale_by_curriculum=True),\n",
645640
" ksim.ActionAccelerationPenalty(scale=-0.01, scale_by_curriculum=True),\n",
646-
" ksim.CtrlPenalty(scale=-0.01, scale_by_curriculum=True),\n",
647641
" # Bespoke rewards.\n",
648642
" BentArmPenalty.create_penalty(physics_model, scale=-0.1),\n",
649643
" StraightLegPenalty.create_penalty(physics_model, scale=-0.1),\n",
@@ -656,11 +650,8 @@
656650
" ]\n",
657651
"\n",
658652
" def get_curriculum(self, physics_model: ksim.PhysicsModel) -> ksim.Curriculum:\n",
659-
" return ksim.ConstantCurriculum(\n",
660-
" # We toggle domain randomization by setting the curriculum level.\n",
661-
" # Since the domain randomization functions all use this level,\n",
662-
" # this effectively toggles them on and off.\n",
663-
" level=1.0 if self.config.use_domain_randomization else 0.0,\n",
653+
" return ksim.DistanceFromOriginCurriculum(\n",
654+
" min_level_steps=5,\n",
664655
" )\n",
665656
"\n",
666657
" def get_model(self, key: PRNGKeyArray) -> Model:\n",

0 commit comments

Comments
 (0)