// Training run configuration (TrainConfig, schema version 3) targeting the
// environment with id "BevyMultiSnake". Layout only: one field per line,
// nested structs indented by four spaces.
TrainConfig(
    version: 3,

    // Environment selection.
    env: EnvConfig(
        kwargs: "{}",
        id: "BevyMultiSnake",
        validate: true,
    ),

    // Policy network settings, including the nested relative-position
    // encoding block.
    net: RogueNetConfig(
        embd_pdrop: 0.0,
        resid_pdrop: 0.0,
        attn_pdrop: 0.0,
        n_layer: 2,
        n_head: 2,
        d_model: 8,
        pooling: None,
        relpos_encoding: RelposEncodingConfig(
            extent: [10, 10],
            position_features: ["x", "y"],
            scale: 1.0,
            per_entity_values: false,
            exclude_entities: [],
            value_relpos_projection: false,
            key_relpos_projection: false,
            per_entity_projections: false,
            radial: false,
            distance: false,
            rotation_vec_features: None,
            rotation_angle_feature: None,
            interpolate: false,
            value_gate: "relu",
        ),
        d_qk: 16,
        translation: None,
    ),

    // Optimizer settings.
    optim: OptimizerConfig(
        lr: 0.001,
        bs: 1024,
        weight_decay: 0.0,
        micro_bs: None,
        anneal_lr: true,
        update_epochs: 3,
        max_grad_norm: 2.0,
    ),

    // PPO settings.
    ppo: PPOConfig(
        gae: true,
        gamma: 0.99,
        gae_lambda: 0.95,
        norm_adv: true,
        clip_coef: 0.2,
        clip_vloss: true,
        ent_coef: 0.1,
        vf_coef: 0.5,
        target_kl: None,
        anneal_entropy: true,
    ),

    // Rollout settings.
    rollout: RolloutConfig(
        steps: 16,
        num_envs: 128,
        processes: 4,
    ),

    // Optional sections left unset in this config.
    eval: None,
    vf_net: None,

    // Run-level settings.
    name: "config",
    seed: 1,
    total_timesteps: 25000,
    max_train_time: None,
    torch_deterministic: true,
    cuda: true,

    // NOTE(review): wandb_project_name is "autochess" although the env id is
    // "BevyMultiSnake"; `track` is false here -- confirm the project name is
    // intended before enabling tracking.
    track: false,
    wandb_project_name: "autochess",
    wandb_entity: "cswinter",

    capture_samples: None,
    capture_logits: false,
    capture_samples_subsample: 1,
    trial: None,
    data_dir: ".",
    cuda_empty_cache: false,
)