We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 8cc0677 commit 9f2ebd9 — Copy full SHA for 9f2ebd9
improving_transformers_world_model/agent.py
@@ -503,7 +503,7 @@ def critic_loss(
503
504
# value clipping
505
506
- clipped_value = old_values + (critic_value - old_values).clamp(1. - eps, 1. + eps)
+ clipped_value = old_values + (critic_value - old_values).clamp(-eps, eps)
507
508
clipped_loss = loss_fn(clipped_value, returns, reduction = 'none')
509
loss = loss_fn(critic_logits, returns, reduction = 'none')
pyproject.toml
@@ -1,6 +1,6 @@
1
[project]
2
name = "improving-transformers-world-model"
3
-version = "0.0.55"
+version = "0.0.56"
4
description = "Improving Transformers World Model for RL"
5
authors = [
6
{ name = "Phil Wang", email = "lucidrains@gmail.com" }
0 commit comments