// Training-run configuration: one nested `TrainConfig` value with sections for
// the environment, policy network, optimizer, PPO settings and rollout
// collection, followed by run-level settings (seed, tracking, capture, paths).
// NOTE(review): the meaning of each field is defined by the loader that reads
// this file, which is not part of this file; notes below marked "presumably"
// are inferred from field names and should be confirmed against that loader.
TrainConfig(
    // Config schema version.
    version: 3,
    // --- Environment ---
    env: EnvConfig(
        // String holding an empty object literal, i.e. no extra environment
        // arguments are supplied here.
        kwargs: "{}",
        id: "BevyMultiSnake",
        validate: true,
    ),
    // --- Policy network ---
    net: RogueNetConfig(
        // All three dropout probabilities are set to zero.
        embd_pdrop: 0.0,
        resid_pdrop: 0.0,
        attn_pdrop: 0.0,
        n_layer: 2,
        n_head: 2,
        d_model: 8,
        pooling: None,
        // Relative-position encoding over the "x" and "y" features.
        relpos_encoding: RelposEncodingConfig(
            // Two entries, matching the two entries of `position_features`.
            // NOTE(review): presumably one extent per position feature — confirm.
            extent: [
                10,
                10,
            ],
            position_features: [
                "x",
                "y",
            ],
            scale: 1.0,
            per_entity_values: false,
            exclude_entities: [],
            value_relpos_projection: false,
            key_relpos_projection: false,
            per_entity_projections: false,
            radial: false,
            distance: false,
            rotation_vec_features: None,
            rotation_angle_feature: None,
            interpolate: false,
            value_gate: "relu",
        ),
        // NOTE(review): d_qk (16) is larger than d_model (8); confirm this is
        // intended for such a small model.
        d_qk: 16,
        translation: None,
    ),
    // --- Optimizer ---
    optim: OptimizerConfig(
        lr: 0.001,
        // NOTE(review): presumably the batch size per optimizer step; with
        // rollout.steps * rollout.num_envs = 16 * 128 = 2048 this would be half
        // of one rollout — confirm against the trainer.
        bs: 1024,
        weight_decay: 0.0,
        micro_bs: None,
        anneal_lr: true,
        update_epochs: 3,
        max_grad_norm: 2.0,
    ),
    // --- PPO settings ---
    ppo: PPOConfig(
        gae: true,
        gamma: 0.99,
        gae_lambda: 0.95,
        norm_adv: true,
        clip_coef: 0.2,
        clip_vloss: true,
        ent_coef: 0.1,
        vf_coef: 0.5,
        target_kl: None,
        anneal_entropy: true,
    ),
    // --- Rollout collection ---
    rollout: RolloutConfig(
        steps: 16,
        // 128 is evenly divisible by `processes` (4).
        // NOTE(review): presumably environments are split across worker
        // processes — confirm.
        num_envs: 128,
        processes: 4,
    ),
    // No evaluation config and no separate value-function network are set.
    eval: None,
    vf_net: None,
    // --- Run-level settings ---
    name: "config",
    seed: 1,
    total_timesteps: 25000,
    max_train_time: None,
    torch_deterministic: true,
    // NOTE(review): CUDA is requested; confirm how the trainer behaves on
    // machines without a GPU.
    cuda: true,
    // Tracking is disabled here.
    // NOTE(review): presumably the wandb_* fields below are unused while
    // `track` is false — confirm. `wandb_entity` names a specific account.
    track: false,
    wandb_project_name: "autochess",
    wandb_entity: "cswinter",
    // Sample capture and logit capture are both off.
    capture_samples: None,
    capture_logits: false,
    capture_samples_subsample: 1,
    trial: None,
    // "." is a relative path.
    // NOTE(review): presumably resolved against the process working directory
    // — confirm.
    data_dir: ".",
    cuda_empty_cache: false,
)