jakegrigsby committed on
Commit
99683fc
·
verified ·
1 Parent(s): 033b28d

Delete synthetic-rl-v2/synthetic-rl-v1

Browse files
synthetic-rl-v2/synthetic-rl-v1/config.txt DELETED
@@ -1,106 +0,0 @@
1
- # Parameters for Actor:
2
- # ==============================================================================
3
- Actor.activation = 'leaky_relu'
4
- Actor.cont_dist_kind = 'normal'
5
- Actor.d_hidden = 512
6
- Actor.dropout_p = 0.0
7
- Actor.gmm_modes = 5
8
- Actor.log_std_high = 2.0
9
- Actor.log_std_low = -5.0
10
- Actor.n_layers = 2
11
-
12
- # Parameters for Agent:
13
- # ==============================================================================
14
- Agent.fake_filter = False
15
- Agent.gamma = 0.999
16
- Agent.num_critics = 6
17
- Agent.num_critics_td = 2
18
- Agent.offline_coeff = 1.0
19
- Agent.online_coeff = 0.0
20
- Agent.popart = True
21
- Agent.reward_multiplier = 10.0
22
- Agent.tau = 0.003
23
- Agent.use_multigamma = True
24
- Agent.use_target_actor = True
25
-
26
- # Parameters for Experiment:
27
- # ==============================================================================
28
- Experiment.batches_per_update = 1
29
- Experiment.critic_loss_weight = 10.0
30
- Experiment.env_mode = 'async'
31
- Experiment.force_reset_train_envs_every = None
32
- Experiment.grad_clip = 1.0
33
- Experiment.has_replay_buffer_rights = True
34
- Experiment.l2_coeff = 0.001
35
- Experiment.learning_rate = 0.0001
36
- Experiment.local_time_optimizer = False
37
- Experiment.lr_warmup_steps = 500
38
- Experiment.mixed_precision = 'no'
39
- Experiment.padded_sampling = 'none'
40
- Experiment.save_trajs_as = 'npz'
41
- Experiment.stagger_traj_file_lengths = True
42
- Experiment.wandb_group_name = None
43
-
44
- # Parameters for FlashAttention:
45
- # ==============================================================================
46
- FlashAttention.window_size = (-1, -1)
47
-
48
- # Parameters for MetamonTstepEncoder:
49
- # ==============================================================================
50
- MetamonTstepEncoder.d_model = 160
51
- MetamonTstepEncoder.extra_emb_dim = 18
52
- MetamonTstepEncoder.n_heads = 8
53
- MetamonTstepEncoder.n_layers = 5
54
- MetamonTstepEncoder.scratch_tokens = 11
55
- MetamonTstepEncoder.token_mask_aug = False
56
-
57
- # Parameters for Multigammas:
58
- # ==============================================================================
59
- Multigammas.continuous = [0.1, 0.9, 0.95, 0.97, 0.99, 0.995]
60
- Multigammas.discrete = [0.1, 0.9, 0.95, 0.97, 0.99, 0.995]
61
-
62
- # Parameters for MultiModalEmbedding:
63
- # ==============================================================================
64
- MultiModalEmbedding.dropout = 0.05
65
- MultiModalEmbedding.numerical_tokens = 6
66
-
67
- # Parameters for NCritics:
68
- # ==============================================================================
69
- NCritics.activation = 'leaky_relu'
70
- NCritics.d_hidden = 512
71
- NCritics.dropout_p = 0.0
72
- NCritics.n_layers = 2
73
-
74
- # Parameters for PopArtLayer:
75
- # ==============================================================================
76
- PopArtLayer.beta = 0.0005
77
- PopArtLayer.init_nu = 100.0
78
-
79
- # Parameters for TformerTrajEncoder:
80
- # ==============================================================================
81
- TformerTrajEncoder.activation = 'leaky_relu'
82
- TformerTrajEncoder.causal = True
83
- TformerTrajEncoder.d_ff = 5120
84
- TformerTrajEncoder.d_model = 1280
85
- TformerTrajEncoder.dropout_attn = 0.0
86
- TformerTrajEncoder.dropout_emb = 0.05
87
- TformerTrajEncoder.dropout_ff = 0.05
88
- TformerTrajEncoder.dropout_qkv = 0.0
89
- TformerTrajEncoder.head_scaling = True
90
- TformerTrajEncoder.n_heads = 20
91
- TformerTrajEncoder.n_layers = 9
92
- TformerTrajEncoder.norm = 'layer'
93
- TformerTrajEncoder.normformer_norms = True
94
- TformerTrajEncoder.sigma_reparam = True
95
-
96
- # Parameters for TimestepTransformer:
97
- # ==============================================================================
98
- # None.
99
-
100
- # Parameters for TokenEmbedding:
101
- # ==============================================================================
102
- # None.
103
-
104
- # Parameters for TransformerTurnEmbedding:
105
- # ==============================================================================
106
- TransformerTurnEmbedding.dropout = 0.05