Ryukijano committed on
Commit
24d9572
·
verified ·
1 Parent(s): 23cd0bf

Add 13-06-07_gemma_le/checkpoints/005000

Browse files
runs/13-06-07_gemma_le/checkpoints/005000/config.json ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "n_obs_steps": 1,
3
+ "normalization_mapping": {
4
+ "VISUAL": "MEAN_STD",
5
+ "STATE": "MIN_MAX",
6
+ "ACTION": "MIN_MAX"
7
+ },
8
+ "input_features": {
9
+ "observation.images.egoview": {
10
+ "type": "VISUAL",
11
+ "shape": [
12
+ 3,
13
+ 800,
14
+ 1280
15
+ ]
16
+ },
17
+ "observation.images.ego_view": {
18
+ "type": "VISUAL",
19
+ "shape": [
20
+ 3,
21
+ 256,
22
+ 256
23
+ ]
24
+ },
25
+ "observation.state": {
26
+ "type": "STATE",
27
+ "shape": [
28
+ 44
29
+ ]
30
+ }
31
+ },
32
+ "output_features": {
33
+ "action": {
34
+ "type": "ACTION",
35
+ "shape": [
36
+ 44
37
+ ]
38
+ }
39
+ },
40
+ "device": "cuda",
41
+ "use_amp": true,
42
+ "chunk_size": 16,
43
+ "n_action_steps": 8,
44
+ "vision_model_id": "/scratch/cbjp404/.cache/hf/models/siglip-so400m-patch14-384",
45
+ "text_model_id": "/scratch/cbjp404/.cache/hf/models/gemma-3-4b-it",
46
+ "use_2d_rope": false,
47
+ "lora_rank": 16,
48
+ "lora_alpha": 16,
49
+ "lora_dropout": 0.1,
50
+ "lora_target_modules": [
51
+ "q_proj",
52
+ "k_proj",
53
+ "v_proj",
54
+ "o_proj"
55
+ ],
56
+ "scaledp_num_layers": 4,
57
+ "scaledp_num_heads": 8,
58
+ "scaledp_dim_model": 512,
59
+ "scaledp_dim_feedforward": 2048,
60
+ "num_diffusion_steps": 100,
61
+ "conditioning_dim": 768,
62
+ "plan_update_interval": 10,
63
+ "optimizer_lr": 0.0001,
64
+ "optimizer_weight_decay": 1e-06
65
+ }
runs/13-06-07_gemma_le/checkpoints/005000/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f2982cef6ea71f434d6c2a611efbc2072396b8c3aa970941a2d81e8dddf66df
3
+ size 9518415952
runs/13-06-07_gemma_le/checkpoints/005000/train_config.json ADDED
@@ -0,0 +1,183 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset": {
3
+ "repo_id": "local/robot_sim.PickNPlace",
4
+ "root": "/scratch/cbjp404/Isaac-GR00T/demo_data/robot_sim.PickNPlace",
5
+ "episodes": [
6
+ 0,
7
+ 1,
8
+ 2,
9
+ 3,
10
+ 4
11
+ ],
12
+ "image_transforms": {
13
+ "enable": false,
14
+ "max_num_transforms": 3,
15
+ "random_order": false,
16
+ "tfs": {
17
+ "brightness": {
18
+ "weight": 1.0,
19
+ "type": "ColorJitter",
20
+ "kwargs": {
21
+ "brightness": [
22
+ 0.8,
23
+ 1.2
24
+ ]
25
+ }
26
+ },
27
+ "contrast": {
28
+ "weight": 1.0,
29
+ "type": "ColorJitter",
30
+ "kwargs": {
31
+ "contrast": [
32
+ 0.8,
33
+ 1.2
34
+ ]
35
+ }
36
+ },
37
+ "saturation": {
38
+ "weight": 1.0,
39
+ "type": "ColorJitter",
40
+ "kwargs": {
41
+ "saturation": [
42
+ 0.5,
43
+ 1.5
44
+ ]
45
+ }
46
+ },
47
+ "hue": {
48
+ "weight": 1.0,
49
+ "type": "ColorJitter",
50
+ "kwargs": {
51
+ "hue": [
52
+ -0.05,
53
+ 0.05
54
+ ]
55
+ }
56
+ },
57
+ "sharpness": {
58
+ "weight": 1.0,
59
+ "type": "SharpnessJitter",
60
+ "kwargs": {
61
+ "sharpness": [
62
+ 0.5,
63
+ 1.5
64
+ ]
65
+ }
66
+ }
67
+ }
68
+ },
69
+ "revision": null,
70
+ "use_imagenet_stats": false,
71
+ "video_backend": "pyav"
72
+ },
73
+ "env": null,
74
+ "policy": {
75
+ "type": "gemma_le",
76
+ "n_obs_steps": 1,
77
+ "normalization_mapping": {
78
+ "VISUAL": "MEAN_STD",
79
+ "STATE": "MIN_MAX",
80
+ "ACTION": "MIN_MAX"
81
+ },
82
+ "input_features": {
83
+ "observation.images.egoview": {
84
+ "type": "VISUAL",
85
+ "shape": [
86
+ 3,
87
+ 800,
88
+ 1280
89
+ ]
90
+ },
91
+ "observation.images.ego_view": {
92
+ "type": "VISUAL",
93
+ "shape": [
94
+ 3,
95
+ 256,
96
+ 256
97
+ ]
98
+ },
99
+ "observation.state": {
100
+ "type": "STATE",
101
+ "shape": [
102
+ 44
103
+ ]
104
+ }
105
+ },
106
+ "output_features": {
107
+ "action": {
108
+ "type": "ACTION",
109
+ "shape": [
110
+ 44
111
+ ]
112
+ }
113
+ },
114
+ "device": "cuda",
115
+ "use_amp": true,
116
+ "chunk_size": 16,
117
+ "n_action_steps": 8,
118
+ "vision_model_id": "/scratch/cbjp404/.cache/hf/models/siglip-so400m-patch14-384",
119
+ "text_model_id": "/scratch/cbjp404/.cache/hf/models/gemma-3-4b-it",
120
+ "use_2d_rope": false,
121
+ "lora_rank": 16,
122
+ "lora_alpha": 16,
123
+ "lora_dropout": 0.1,
124
+ "lora_target_modules": [
125
+ "q_proj",
126
+ "k_proj",
127
+ "v_proj",
128
+ "o_proj"
129
+ ],
130
+ "scaledp_num_layers": 4,
131
+ "scaledp_num_heads": 8,
132
+ "scaledp_dim_model": 512,
133
+ "scaledp_dim_feedforward": 2048,
134
+ "num_diffusion_steps": 100,
135
+ "conditioning_dim": 768,
136
+ "plan_update_interval": 10,
137
+ "optimizer_lr": 0.0001,
138
+ "optimizer_weight_decay": 1e-06
139
+ },
140
+ "output_dir": "outputs/train/2025-08-12/13-06-07_gemma_le",
141
+ "job_name": "gemma_le",
142
+ "resume": false,
143
+ "seed": 1000,
144
+ "num_workers": 0,
145
+ "batch_size": 1,
146
+ "steps": 20000,
147
+ "eval_freq": 20000,
148
+ "log_freq": 10,
149
+ "save_checkpoint": true,
150
+ "save_freq": 5000,
151
+ "use_policy_training_preset": true,
152
+ "optimizer": {
153
+ "type": "adamw",
154
+ "lr": 0.0001,
155
+ "weight_decay": 1e-06,
156
+ "grad_clip_norm": 10.0,
157
+ "betas": [
158
+ 0.9,
159
+ 0.999
160
+ ],
161
+ "eps": 1e-08
162
+ },
163
+ "scheduler": null,
164
+ "eval": {
165
+ "n_episodes": 50,
166
+ "batch_size": 50,
167
+ "use_async_envs": false
168
+ },
169
+ "wandb": {
170
+ "enable": false,
171
+ "disable_artifact": false,
172
+ "project": "lerobot",
173
+ "entity": null,
174
+ "notes": null,
175
+ "run_id": null
176
+ },
177
+ "progress_bar": true,
178
+ "push_to_hub": false,
179
+ "push_repo_id": null,
180
+ "push_branch": null,
181
+ "push_private": false,
182
+ "push_exist_ok": false
183
+ }