{
  "args": {
    "seed": [1],
    "agent_rl_algo": ["ppo"],
    "n_total_updates": [30000],
    "train_runner": ["paired"],
    "n_devices": [1],
    "student_model_name": ["default_student_actor_cnn"],
    "student_critic_model_name": ["default_student_critic_cnn"],
    "env_name": ["Overcooked"],
    "verbose": [false],
    "is_multi_agent": [true],
    "log_dir": ["~/logs/minimax"],
    "log_interval": [10],
    "from_last_checkpoint": [false],
    "checkpoint_interval": [1000],
    "archive_interval": [0],
    "archive_init_checkpoint": [false],
    "test_interval": [100],
    "n_students": [2],
    "n_parallel": [32],
    "n_eval": [1],
    "n_rollout_steps": [400],
    "lr": [3e-4],
    "lr_anneal_steps": [0],
    "max_grad_norm": [0.5],
    "adam_eps": [1e-05],
    "track_env_metrics": [true],
    "discount": [0.999],
    "n_unroll_rollout": [10],
    "render": [false],
    "ued_score": ["relative_regret"],
    "student_gae_lambda": [0.98],
    "teacher_discount": [0.999],
    "teacher_lr_anneal_steps": [0],
    "teacher_gae_lambda": [0.98],
    "student_entropy_coef": [0.01],
    "student_value_loss_coef": [0.5],
    "student_n_unroll_update": [5],
    "student_ppo_n_epochs": [8],
    "student_ppo_n_minibatches": [4],
    "student_ppo_clip_eps": [0.2],
    "student_ppo_clip_value_loss": [true],
    "teacher_entropy_coef": [0.01],
    "teacher_value_loss_coef": [0.5],
    "teacher_n_unroll_update": [5],
    "teacher_ppo_n_epochs": [8],
    "teacher_ppo_n_minibatches": [4],
    "teacher_ppo_clip_eps": [0.2],
    "teacher_ppo_clip_value_loss": [true],
    "student_recurrent_arch": ["s5"],
    "student_recurrent_hidden_dim": [64],
    "student_hidden_dim": [64],
    "student_n_hidden_layers": [3],
    "student_n_conv_layers": [3],
    "student_n_conv_filters": [32],
    "student_n_scalar_embeddings": [4],
    "student_scalar_embed_dim": [5],
    "student_s5_n_blocks": [2],
    "student_s5_n_layers": [2],
    "student_s5_layernorm_pos": ["pre"],
    "student_s5_activation": ["half_glu1"],
    "student_agent_kind": ["mappo"],
    "teacher_model_name": ["default_teacher_cnn"],
    "teacher_recurrent_arch": ["lstm"],
    "teacher_recurrent_hidden_dim": [64],
    "teacher_hidden_dim": [64],
    "teacher_n_hidden_layers": [1],
    "teacher_n_conv_filters": [128],
    "teacher_scalar_embed_dim": [10],
    "overcooked_height": [6],
    "overcooked_width": [9],
    "overcooked_n_walls": [5],
    "overcooked_normalize_obs": [true],
    "overcooked_max_steps": [400],
    "overcooked_random_reset": [false],
    "overcooked_ued_replace_wall_pos": [true],
    "overcooked_ued_fixed_n_wall_steps": [false],
    "overcooked_ued_first_wall_pos_sets_budget": [true],
    "overcooked_ued_noise_dim": [50],
    "overcooked_ued_n_walls": [15],
    "overcooked_ued_normalize_obs": [true],
    "n_shaped_reward_updates": [30000],
    "test_n_episodes": [10],
    "test_env_names": [
      "Overcooked-CoordRing6_9,Overcooked-ForcedCoord6_9,Overcooked-CounterCircuit6_9,Overcooked-AsymmAdvantages6_9,Overcooked-CrampedRoom6_9"
    ],
    "overcooked_test_normalize_obs": [true]
  }
}