{ "args": { "seed": [1], "agent_rl_algo": ["ppo"], "n_total_updates": [30000], "train_runner": ["paired"], "n_devices": [1], "student_model_name": ["default_student_actor_cnn"], "student_critic_model_name": ["default_student_critic_cnn"], "env_name": ["Overcooked"], "verbose": [false], "is_multi_agent": [true], "log_dir": ["~/logs/minimax"], "log_interval": [10], "from_last_checkpoint": [false], "checkpoint_interval": [1000], "archive_interval": [0], "archive_init_checkpoint": [false], "test_interval": [100], "n_students": [2], "n_parallel": [32], "n_eval": [1], "n_rollout_steps": [400], "lr": [3e-4], "lr_anneal_steps": [0], "max_grad_norm": [0.5], "adam_eps": [1e-05], "track_env_metrics": [true], "discount": [0.999], "n_unroll_rollout": [10], "render": [false], "ued_score": ["relative_regret"], "student_gae_lambda": [0.98], "teacher_discount": [0.999], "teacher_lr_anneal_steps": [0], "teacher_gae_lambda": [0.98], "student_entropy_coef": [0.01], "student_value_loss_coef": [0.5], "student_n_unroll_update": [5], "student_ppo_n_epochs": [8], "student_ppo_n_minibatches": [4], "student_ppo_clip_eps": [0.2], "student_ppo_clip_value_loss": [true], "teacher_entropy_coef": [0.01], "teacher_value_loss_coef": [0.5], "teacher_n_unroll_update": [5], "teacher_ppo_n_epochs": [8], "teacher_ppo_n_minibatches": [4], "teacher_ppo_clip_eps": [0.2], "teacher_ppo_clip_value_loss": [true], "student_recurrent_arch": ["s5"], "student_recurrent_hidden_dim": [64], "student_hidden_dim": [64], "student_n_hidden_layers": [3], "student_n_conv_layers": [3], "student_n_conv_filters": [32], "student_n_scalar_embeddings": [4], "student_scalar_embed_dim": [5], "student_s5_n_blocks": [2], "student_s5_n_layers": [2], "student_s5_layernorm_pos": ["pre"], "student_s5_activation": ["half_glu1"], "student_agent_kind": ["mappo"], "teacher_model_name": ["default_teacher_cnn"], "teacher_recurrent_arch": ["lstm"], "teacher_recurrent_hidden_dim": [64], "teacher_hidden_dim": [64], "teacher_n_hidden_layers": [1], "teacher_n_conv_filters": [128], "teacher_scalar_embed_dim": [10], "overcooked_height": [6], "overcooked_width": [9], "overcooked_n_walls": [5], "overcooked_normalize_obs": [true], "overcooked_max_steps": [400], "overcooked_random_reset": [false], "overcooked_ued_replace_wall_pos": [true], "overcooked_ued_fixed_n_wall_steps": [false], "overcooked_ued_first_wall_pos_sets_budget": [true], "overcooked_ued_noise_dim": [50], "overcooked_ued_n_walls": [15], "overcooked_ued_normalize_obs": [true], "n_shaped_reward_updates": [30000], "test_n_episodes": [10], "test_env_names": [ "Overcooked-CoordRing6_9,Overcooked-ForcedCoord6_9,Overcooked-CounterCircuit6_9,Overcooked-AsymmAdvantages6_9,Overcooked-CrampedRoom6_9" ], "overcooked_test_normalize_obs": [true] } }