We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 80a60f1, commit 0ebebec (Copy full SHA for 0ebebec)
1 file changed
experiments/g1/main.py
@@ -36,12 +36,12 @@ class ExperimentConfig:
36
torso_offset_range: tuple[float, float] = (-2.0, 5.0)
37
38
# L2C2
39
- l2c2_lambda_pi: float = 1.0
40
- l2c2_lambda_v: float = 0.1
+ l2c2_lambda_pi: float = 5.0
+ l2c2_lambda_v: float = 0.5
41
42
# Reward weights
43
task_weight: float = 2.5
44
- regularization_weight: float = 0.1
+ regularization_weight: float = 1.0
45
style_weight: float = 1.0
46
target_weight: float = 1.0
47
0 commit comments