imone committed on
Commit
ee2c595
·
verified ·
1 Parent(s): e11817d

Upload folder using huggingface_hub

Browse files
Files changed (3) hide show
  1. .gitattributes +1 -0
  2. all_config.yaml +35 -0
  3. checkpoint +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ checkpoint filter=lfs diff=lfs merge=lfs -text
all_config.yaml ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ arch:
2
+ H_cycles: 2
3
+ H_layers: 4
4
+ L_cycles: 2
5
+ L_layers: 4
6
+ expansion: 4
7
+ halt_exploration_prob: 0.1
8
+ halt_max_steps: 16
9
+ hidden_size: 512
10
+ loss:
11
+ loss_type: stablemax_cross_entropy
12
+ name: losses@ACTLossHead
13
+ name: hrm.hrm_act_v1@HierarchicalReasoningModel_ACTV1
14
+ num_heads: 8
15
+ pos_encodings: rope
16
+ puzzle_emb_ndim: 512
17
+ beta1: 0.9
18
+ beta2: 0.95
19
+ checkpoint_every_eval: true
20
+ checkpoint_path: checkpoints/Arc-2-aug-1000 ACT-torch/HierarchicalReasoningModel_ACTV1
21
+ bright-mustang
22
+ data_path: data/arc-2-aug-1000
23
+ epochs: 100000
24
+ eval_interval: 10000
25
+ eval_save_outputs: []
26
+ global_batch_size: 768
27
+ lr: 0.0001
28
+ lr_min_ratio: 1.0
29
+ lr_warmup_steps: 2000
30
+ project_name: Arc-2-aug-1000 ACT-torch
31
+ puzzle_emb_lr: 0.01
32
+ puzzle_emb_weight_decay: 0.1
33
+ run_name: HierarchicalReasoningModel_ACTV1 bright-mustang
34
+ seed: 0
35
+ weight_decay: 0.1
checkpoint ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58719e51da6cd7712eb4197f908fbfdc88403ee48c42a3a92bab9f9c968df64d
3
+ size 2250983821