Skip to content

Commit

Permalink
update and align new terms
Browse files (browse the repository at this point in the history)
  • Loading branch information
rradules committed Jun 18, 2024
1 parent ceb2473 commit 70a15fe
Show file tree
Hide file tree
Showing 4 changed files with 7 additions and 7 deletions.
6 changes: 3 additions & 3 deletions momaland/learning/morl/random_centralised_agent_example.py
Original file line number Diff line number Diff line change
Expand Up @@ -44,7 +44,7 @@ def train_random(moma_env):
num_timesteps=50,
initial_map=test_map,
randomise=True,
- reward_mode="test",
+ reward_mode="individual",
render_mode=None,
)

Expand All @@ -55,11 +55,11 @@ def train_random(moma_env):
type_distribution=[0.5, 0.5],
position_distribution=[0.5, 1],
num_timesteps=10,
- reward_scheme="local",
+ reward_mode="individual",
)

train_random(ig_env)
- # train_random(mobpd_env)
+ train_random(mobpd_env)

# train_sa_random(ig_env)
# train_sa_random(mobpd_env)
4 changes: 2 additions & 2 deletions momaland/learning/morl/sa_env_factory.py
Original file line number Diff line number Diff line change
Expand Up @@ -34,7 +34,7 @@ def make_single_agent_bpd_env(size="small"):
bpd_env = mobeach_v0.parallel_env(
num_timesteps=5,
num_agents=10,
- reward_scheme="global",
+ reward_mode="team",
sections=3,
capacity=2,
type_distribution=(0.7, 0.3),
Expand All @@ -44,7 +44,7 @@ def make_single_agent_bpd_env(size="small"):
bpd_env = moitem_gathering_v0.parallel_env(
num_timesteps=1,
num_agents=50,
- reward_scheme="global",
+ reward_mode="team",
sections=5,
capacity=3,
type_distribution=(0.7, 0.3),
Expand Down
2 changes: 1 addition & 1 deletion momaland/learning/morl/train_ig_GPILS.py
Original file line number Diff line number Diff line change
Expand Up @@ -43,7 +43,7 @@
gradient_updates=10,
target_net_update_freq=200,
tau=1,
- log=False, # set this to True to turn on wandb logging
+ log=True,
project_name=project_name,
seed=seed,
)
Expand Down
2 changes: 1 addition & 1 deletion momaland/learning/morl/train_ig_PCN.py
Original file line number Diff line number Diff line change
Expand Up @@ -40,7 +40,7 @@
batch_size=256,
project_name=project_name,
experiment_name="PCN",
- log=False, # set this to True to turn on wandb logging
+ log=True,
)
timesteps_per_iter = 10000
agent.train(
Expand Down

0 comments on commit 70a15fe

Please sign in to comment.