Behaviour refinement - fence penalty
This commit is contained in:
@@ -61,11 +61,11 @@ class HerdingEnv(gym.Env):
|
||||
W_COMPLETE = 100.0 # all sheep penned
|
||||
W_STEP_COST = 0.02 # time penalty — strong enough to punish doing nothing
|
||||
W_COMPACT = 0.0 # reward for flock-radius reduction (off by default)
|
||||
W_WALL_TOUCH = 0.05 # per-sheep, per-step penalty when an active sheep is
|
||||
# pinned against the outside of a pen W/E wall. Direct
|
||||
# signal against the wall-corraling exploit so the
|
||||
# policy generalises better to Webots pillared walls.
|
||||
WALL_TOUCH_BUFFER = 0.5 # metres outside the wall counted as "touching"
|
||||
W_WALL_TOUCH = 0.01 # per-sheep, per-step penalty when an active sheep is
|
||||
# pinned against the outside of a pen W/E wall. Kept
|
||||
# small (< W_STEP_COST) so the dog isn't incentivised to
|
||||
# hover above the entrance to avoid the penalty.
|
||||
WALL_TOUCH_BUFFER = 0.3 # metres outside the wall counted as "touching"
|
||||
ALIGN_SHAPE = "standoff" # "standoff" (peaks at IDEAL) | "near" (peaks at 0)
|
||||
ALIGN_GATED = True # gate alignment on action magnitude
|
||||
ENTRY_AWARE = True # progress reward targets PEN_ENTRY (entrance face), not
|
||||
|
||||
Reference in New Issue
Block a user