{ "args": { "seed": [1], "agent_rl_algo": ["ppo"], "n_total_updates": [30000], "train_runner": ["plr"], "n_devices": [1], "student_model_name": ["default_student_cnn"], "env_name": ["Maze"], "verbose": [false], "log_dir": ["~/logs/minimax"], "log_interval": [10], "from_last_checkpoint": [true], "checkpoint_interval": [1000], "archive_interval": [0], "archive_init_checkpoint": [false], "test_interval": [100], "n_students": [1], "n_parallel": [32], "n_eval": [1], "n_rollout_steps": [256], "lr": [1e-05], "lr_anneal_steps": [0], "max_grad_norm": [0.5], "adam_eps": [1e-05], "track_env_metrics": [true], "discount": [0.999], "n_unroll_rollout": [10], "render": [false], "ued_score": ["max_mc"], "plr_replay_prob": [0.8], "plr_buffer_size": [4000], "plr_staleness_coef": [0.3], "plr_temp": [0.3], "plr_use_score_ranks": [true], "plr_min_fill_ratio": [0.5], "plr_use_robust_plr": [true], "plr_use_parallel_eval": [true], "plr_force_unique": [true], "plr_mutation_fn": ["default"], "plr_n_mutations": [20], "plr_mutation_criterion": ["batch"], "plr_mutation_subsample_size": [4], "student_gae_lambda": [0.98], "student_entropy_coef": [0.0], "student_value_loss_coef": [0.5], "student_n_unroll_update": [5], "student_ppo_n_epochs": [5], "student_ppo_n_minibatches": [1], "student_ppo_clip_eps": [0.2], "student_ppo_clip_value_loss": [true], "student_recurrent_arch": ["s5"], "student_recurrent_hidden_dim": [256], "student_hidden_dim": [32], "student_n_hidden_layers": [1], "student_n_conv_filters": [16], "student_n_scalar_embeddings": [4], "student_scalar_embed_dim": [5], "student_s5_n_blocks": [2], "student_s5_n_layers": [2], "student_s5_layernorm_pos": ["post"], "student_s5_activation": ["half_glu1"], "maze_height": [13], "maze_width": [13], "maze_n_walls": [0], "maze_replace_wall_pos": [true], "maze_sample_n_walls": [false], "maze_see_agent": [false], "maze_normalize_obs": [true], "maze_obs_agent_pos": [false], "maze_max_episode_steps": [250], "test_n_episodes": [10], "test_env_names": ["Maze-SixteenRooms,Maze-Labyrinth,Maze-StandardMaze"], "maze_test_see_agent": [false], "maze_test_normalize_obs": [true] } }