|
# Parameters for Actor: |
|
# ============================================================================== |
|
Actor.activation = 'leaky_relu' |
|
Actor.cont_dist_kind = 'normal' |
|
Actor.d_hidden = 512 |
|
Actor.dropout_p = 0.0 |
|
Actor.gmm_modes = 5 |
|
Actor.log_std_high = 2.0 |
|
Actor.log_std_low = -5.0 |
|
Actor.n_layers = 2 |
|
|
|
# Parameters for Agent: |
|
# ============================================================================== |
|
Agent.fake_filter = False |
|
Agent.gamma = 0.999 |
|
Agent.num_critics = 6 |
|
Agent.num_critics_td = 2 |
|
Agent.offline_coeff = 1.0 |
|
Agent.online_coeff = 0.0 |
|
Agent.popart = True |
|
Agent.reward_multiplier = 10.0 |
|
Agent.tau = 0.003 |
|
Agent.use_multigamma = True |
|
Agent.use_target_actor = True |
|
|
|
# Parameters for Experiment: |
|
# ============================================================================== |
|
Experiment.batches_per_update = 1 |
|
Experiment.critic_loss_weight = 10.0 |
|
Experiment.env_mode = 'async' |
|
Experiment.force_reset_train_envs_every = None |
|
Experiment.grad_clip = 1.0 |
|
Experiment.has_replay_buffer_rights = True |
|
Experiment.l2_coeff = 0.001 |
|
Experiment.learning_rate = 0.0001 |
|
Experiment.local_time_optimizer = False |
|
Experiment.lr_warmup_steps = 500 |
|
Experiment.mixed_precision = 'no' |
|
Experiment.padded_sampling = 'none' |
|
Experiment.save_trajs_as = 'npz' |
|
Experiment.stagger_traj_file_lengths = True |
|
Experiment.wandb_group_name = None |
|
|
|
# Parameters for FlashAttention: |
|
# ============================================================================== |
|
FlashAttention.window_size = (-1, -1) |
|
|
|
# Parameters for MetamonTstepEncoder: |
|
# ============================================================================== |
|
MetamonTstepEncoder.d_model = 160 |
|
MetamonTstepEncoder.extra_emb_dim = 18 |
|
MetamonTstepEncoder.n_heads = 8 |
|
MetamonTstepEncoder.n_layers = 5 |
|
MetamonTstepEncoder.scratch_tokens = 11 |
|
MetamonTstepEncoder.token_mask_aug = False |
|
|
|
# Parameters for Multigammas: |
|
# ============================================================================== |
|
Multigammas.continuous = [0.1, 0.9, 0.95, 0.97, 0.99, 0.995] |
|
Multigammas.discrete = [0.1, 0.9, 0.95, 0.97, 0.99, 0.995] |
|
|
|
# Parameters for MultiModalEmbedding: |
|
# ============================================================================== |
|
MultiModalEmbedding.dropout = 0.05 |
|
MultiModalEmbedding.numerical_tokens = 6 |
|
|
|
# Parameters for NCritics: |
|
# ============================================================================== |
|
NCritics.activation = 'leaky_relu' |
|
NCritics.d_hidden = 512 |
|
NCritics.dropout_p = 0.0 |
|
NCritics.n_layers = 2 |
|
|
|
# Parameters for PopArtLayer: |
|
# ============================================================================== |
|
PopArtLayer.beta = 0.0005 |
|
PopArtLayer.init_nu = 100.0 |
|
|
|
# Parameters for TformerTrajEncoder: |
|
# ============================================================================== |
|
TformerTrajEncoder.activation = 'leaky_relu' |
|
TformerTrajEncoder.causal = True |
|
TformerTrajEncoder.d_ff = 5120 |
|
TformerTrajEncoder.d_model = 1280 |
|
TformerTrajEncoder.dropout_attn = 0.0 |
|
TformerTrajEncoder.dropout_emb = 0.05 |
|
TformerTrajEncoder.dropout_ff = 0.05 |
|
TformerTrajEncoder.dropout_qkv = 0.0 |
|
TformerTrajEncoder.head_scaling = True |
|
TformerTrajEncoder.n_heads = 20 |
|
TformerTrajEncoder.n_layers = 9 |
|
TformerTrajEncoder.norm = 'layer' |
|
TformerTrajEncoder.normformer_norms = True |
|
TformerTrajEncoder.sigma_reparam = True |
|
|
|
# Parameters for TimestepTransformer: |
|
# ============================================================================== |
|
# None (no parameter values are listed for TimestepTransformer). |
|
|
|
# Parameters for TokenEmbedding: |
|
# ============================================================================== |
|
# None (no parameter values are listed for TokenEmbedding). |
|
|
|
# Parameters for TransformerTurnEmbedding: |
|
# ============================================================================== |
|
TransformerTurnEmbedding.dropout = 0.05 |
|
|