youliangtan commited on
Commit
71c408e
·
verified ·
1 Parent(s): 33e9a7a

Upload folder using huggingface_hub

Browse files
config.json ADDED
@@ -0,0 +1,64 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "action_dim": 32,
3
+ "action_head_cfg": {
4
+ "action_dim": 32,
5
+ "action_horizon": 16,
6
+ "add_pos_embed": true,
7
+ "backbone_embedding_dim": 2048,
8
+ "diffusion_model_cfg": {
9
+ "attention_head_dim": 48,
10
+ "cross_attention_dim": 2048,
11
+ "dropout": 0.2,
12
+ "final_dropout": true,
13
+ "interleave_self_attention": true,
14
+ "norm_type": "ada_norm",
15
+ "num_attention_heads": 32,
16
+ "num_layers": 16,
17
+ "output_dim": 1024,
18
+ "positional_embeddings": null
19
+ },
20
+ "hidden_size": 1024,
21
+ "input_embedding_dim": 1536,
22
+ "max_action_dim": 32,
23
+ "max_state_dim": 64,
24
+ "model_dtype": "float32",
25
+ "noise_beta_alpha": 1.5,
26
+ "noise_beta_beta": 1.0,
27
+ "noise_s": 0.999,
28
+ "num_inference_timesteps": 4,
29
+ "num_target_vision_tokens": 32,
30
+ "num_timestep_buckets": 1000,
31
+ "tune_diffusion_model": true,
32
+ "tune_projector": true,
33
+ "use_vlln": true,
34
+ "vl_self_attention_cfg": {
35
+ "attention_head_dim": 64,
36
+ "dropout": 0.2,
37
+ "final_dropout": true,
38
+ "num_attention_heads": 32,
39
+ "num_layers": 4,
40
+ "positional_embeddings": null
41
+ }
42
+ },
43
+ "action_horizon": 16,
44
+ "architectures": [
45
+ "GR00T_N1_5"
46
+ ],
47
+ "attn_implementation": null,
48
+ "backbone_cfg": {
49
+ "eagle_path": "NVEagle/eagle_er-qwen3_1_7B-Siglip2_400M_stage1_5_128gpu_er_v7_1mlp_nops",
50
+ "load_bf16": false,
51
+ "project_to_dim": null,
52
+ "reproject_vision": false,
53
+ "select_layer": 12,
54
+ "tune_llm": false,
55
+ "tune_visual": true,
56
+ "use_flash_attention": true
57
+ },
58
+ "compute_dtype": "bfloat16",
59
+ "hidden_size": 2048,
60
+ "model_dtype": "float32",
61
+ "model_type": "gr00t_n1_5",
62
+ "torch_dtype": "bfloat16",
63
+ "transformers_version": "4.51.3"
64
+ }
experiment_cfg/metadata.json ADDED
@@ -0,0 +1,447 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "new_embodiment": {
3
+ "statistics": {
4
+ "state": {
5
+ "x": {
6
+ "max": [
7
+ 1.0534898042678833
8
+ ],
9
+ "min": [
10
+ -0.4436439275741577
11
+ ],
12
+ "mean": [
13
+ 0.5598947405815125
14
+ ],
15
+ "std": [
16
+ 0.12432649731636047
17
+ ],
18
+ "q01": [
19
+ 0.32481380939483645
20
+ ],
21
+ "q99": [
22
+ 0.8750156319141384
23
+ ]
24
+ },
25
+ "y": {
26
+ "max": [
27
+ 0.48018959164619446
28
+ ],
29
+ "min": [
30
+ -0.9970501065254211
31
+ ],
32
+ "mean": [
33
+ -0.08334138244390488
34
+ ],
35
+ "std": [
36
+ 0.11558396369218826
37
+ ],
38
+ "q01": [
39
+ -0.28334290891885755
40
+ ],
41
+ "q99": [
42
+ 0.21247054174542404
43
+ ]
44
+ },
45
+ "z": {
46
+ "max": [
47
+ 1.6896663904190063
48
+ ],
49
+ "min": [
50
+ -0.006579156965017319
51
+ ],
52
+ "mean": [
53
+ 0.7770950198173523
54
+ ],
55
+ "std": [
56
+ 0.24595585465431213
57
+ ],
58
+ "q01": [
59
+ 0.14107070609927178
60
+ ],
61
+ "q99": [
62
+ 1.0727112340927123
63
+ ]
64
+ },
65
+ "rx": {
66
+ "max": [
67
+ 0.9999993443489075
68
+ ],
69
+ "min": [
70
+ -0.8643477559089661
71
+ ],
72
+ "mean": [
73
+ -0.24804554879665375
74
+ ],
75
+ "std": [
76
+ 0.5126774907112122
77
+ ],
78
+ "q01": [
79
+ -0.686474204659462
80
+ ],
81
+ "q99": [
82
+ 0.9377871316671368
83
+ ]
84
+ },
85
+ "ry": {
86
+ "max": [
87
+ 0.9999874830245972
88
+ ],
89
+ "min": [
90
+ -0.7079970240592957
91
+ ],
92
+ "mean": [
93
+ 0.4951382279396057
94
+ ],
95
+ "std": [
96
+ 0.5218117237091064
97
+ ],
98
+ "q01": [
99
+ -0.6808923494815826
100
+ ],
101
+ "q99": [
102
+ 0.9563051050901409
103
+ ]
104
+ },
105
+ "rz": {
106
+ "max": [
107
+ 0.9554369449615479
108
+ ],
109
+ "min": [
110
+ -0.7688722014427185
111
+ ],
112
+ "mean": [
113
+ 0.09266126900911331
114
+ ],
115
+ "std": [
116
+ 0.16630452871322632
117
+ ],
118
+ "q01": [
119
+ -0.36045596331357954
120
+ ],
121
+ "q99": [
122
+ 0.45990042358636823
123
+ ]
124
+ },
125
+ "rw": {
126
+ "max": [
127
+ 0.9914546012878418
128
+ ],
129
+ "min": [
130
+ -0.4999994933605194
131
+ ],
132
+ "mean": [
133
+ 0.2097489982843399
134
+ ],
135
+ "std": [
136
+ 0.2754714787006378
137
+ ],
138
+ "q01": [
139
+ -0.454380963742733
140
+ ],
141
+ "q99": [
142
+ 0.7216041100025177
143
+ ]
144
+ },
145
+ "gripper": {
146
+ "max": [
147
+ 1.0
148
+ ],
149
+ "min": [
150
+ 0.0
151
+ ],
152
+ "mean": [
153
+ 0.4261345863342285
154
+ ],
155
+ "std": [
156
+ 0.4554642140865326
157
+ ],
158
+ "q01": [
159
+ 0.0
160
+ ],
161
+ "q99": [
162
+ 1.0
163
+ ]
164
+ }
165
+ },
166
+ "action": {
167
+ "x": {
168
+ "max": [
169
+ 2.9984593391418457
170
+ ],
171
+ "min": [
172
+ -2.0204520225524902
173
+ ],
174
+ "mean": [
175
+ 0.00698750140145421
176
+ ],
177
+ "std": [
178
+ 0.06921227276325226
179
+ ],
180
+ "q01": [
181
+ -0.22453527510166169
182
+ ],
183
+ "q99": [
184
+ 0.17824687153100965
185
+ ]
186
+ },
187
+ "y": {
188
+ "max": [
189
+ 22.09052848815918
190
+ ],
191
+ "min": [
192
+ -5.497899532318115
193
+ ],
194
+ "mean": [
195
+ 0.006265923380851746
196
+ ],
197
+ "std": [
198
+ 0.059654854238033295
199
+ ],
200
+ "q01": [
201
+ -0.14820013284683228
202
+ ],
203
+ "q99": [
204
+ 0.14938379630446405
205
+ ]
206
+ },
207
+ "z": {
208
+ "max": [
209
+ 2.7507524490356445
210
+ ],
211
+ "min": [
212
+ -2.031663417816162
213
+ ],
214
+ "mean": [
215
+ -0.012625134550035
216
+ ],
217
+ "std": [
218
+ 0.07353131473064423
219
+ ],
220
+ "q01": [
221
+ -0.231589707583189
222
+ ],
223
+ "q99": [
224
+ 0.21842354819178575
225
+ ]
226
+ },
227
+ "roll": {
228
+ "max": [
229
+ 1.570636510848999
230
+ ],
231
+ "min": [
232
+ -1.569917917251587
233
+ ],
234
+ "mean": [
235
+ 0.04333191365003586
236
+ ],
237
+ "std": [
238
+ 0.1561005562543869
239
+ ],
240
+ "q01": [
241
+ -0.3517994859814644
242
+ ],
243
+ "q99": [
244
+ 0.5892666035890578
245
+ ]
246
+ },
247
+ "pitch": {
248
+ "max": [
249
+ 1.5321086645126343
250
+ ],
251
+ "min": [
252
+ -1.569892168045044
253
+ ],
254
+ "mean": [
255
+ -0.005756167229264975
256
+ ],
257
+ "std": [
258
+ 0.13164213299751282
259
+ ],
260
+ "q01": [
261
+ -0.4193011274933815
262
+ ],
263
+ "q99": [
264
+ 0.35272657424211445
265
+ ]
266
+ },
267
+ "yaw": {
268
+ "max": [
269
+ 1.5691522359848022
270
+ ],
271
+ "min": [
272
+ -1.570419430732727
273
+ ],
274
+ "mean": [
275
+ 0.0009130979306064546
276
+ ],
277
+ "std": [
278
+ 0.1459326595067978
279
+ ],
280
+ "q01": [
281
+ -0.43643461108207704
282
+ ],
283
+ "q99": [
284
+ 0.44796681255102094
285
+ ]
286
+ },
287
+ "gripper": {
288
+ "max": [
289
+ 1.0
290
+ ],
291
+ "min": [
292
+ 0.0
293
+ ],
294
+ "mean": [
295
+ 0.5354204773902893
296
+ ],
297
+ "std": [
298
+ 0.4971078634262085
299
+ ],
300
+ "q01": [
301
+ 0.0
302
+ ],
303
+ "q99": [
304
+ 1.0
305
+ ]
306
+ }
307
+ }
308
+ },
309
+ "modalities": {
310
+ "video": {
311
+ "image": {
312
+ "resolution": [
313
+ 320,
314
+ 256
315
+ ],
316
+ "channels": 3,
317
+ "fps": 3.0
318
+ }
319
+ },
320
+ "state": {
321
+ "x": {
322
+ "absolute": true,
323
+ "rotation_type": null,
324
+ "shape": [
325
+ 1
326
+ ],
327
+ "continuous": true
328
+ },
329
+ "y": {
330
+ "absolute": true,
331
+ "rotation_type": null,
332
+ "shape": [
333
+ 1
334
+ ],
335
+ "continuous": true
336
+ },
337
+ "z": {
338
+ "absolute": true,
339
+ "rotation_type": null,
340
+ "shape": [
341
+ 1
342
+ ],
343
+ "continuous": true
344
+ },
345
+ "rx": {
346
+ "absolute": true,
347
+ "rotation_type": null,
348
+ "shape": [
349
+ 1
350
+ ],
351
+ "continuous": true
352
+ },
353
+ "ry": {
354
+ "absolute": true,
355
+ "rotation_type": null,
356
+ "shape": [
357
+ 1
358
+ ],
359
+ "continuous": true
360
+ },
361
+ "rz": {
362
+ "absolute": true,
363
+ "rotation_type": null,
364
+ "shape": [
365
+ 1
366
+ ],
367
+ "continuous": true
368
+ },
369
+ "rw": {
370
+ "absolute": true,
371
+ "rotation_type": null,
372
+ "shape": [
373
+ 1
374
+ ],
375
+ "continuous": true
376
+ },
377
+ "gripper": {
378
+ "absolute": true,
379
+ "rotation_type": null,
380
+ "shape": [
381
+ 1
382
+ ],
383
+ "continuous": true
384
+ }
385
+ },
386
+ "action": {
387
+ "x": {
388
+ "absolute": true,
389
+ "rotation_type": null,
390
+ "shape": [
391
+ 1
392
+ ],
393
+ "continuous": true
394
+ },
395
+ "y": {
396
+ "absolute": true,
397
+ "rotation_type": null,
398
+ "shape": [
399
+ 1
400
+ ],
401
+ "continuous": true
402
+ },
403
+ "z": {
404
+ "absolute": true,
405
+ "rotation_type": null,
406
+ "shape": [
407
+ 1
408
+ ],
409
+ "continuous": true
410
+ },
411
+ "roll": {
412
+ "absolute": true,
413
+ "rotation_type": null,
414
+ "shape": [
415
+ 1
416
+ ],
417
+ "continuous": true
418
+ },
419
+ "pitch": {
420
+ "absolute": true,
421
+ "rotation_type": null,
422
+ "shape": [
423
+ 1
424
+ ],
425
+ "continuous": true
426
+ },
427
+ "yaw": {
428
+ "absolute": true,
429
+ "rotation_type": null,
430
+ "shape": [
431
+ 1
432
+ ],
433
+ "continuous": true
434
+ },
435
+ "gripper": {
436
+ "absolute": true,
437
+ "rotation_type": null,
438
+ "shape": [
439
+ 1
440
+ ],
441
+ "continuous": true
442
+ }
443
+ }
444
+ },
445
+ "embodiment_tag": "new_embodiment"
446
+ }
447
+ }
model-00001-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3144c315de74ca87060f90ca08e057c5e93d577b5078074b2916378087d4a130
3
+ size 4999367032
model-00002-of-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e6c971ec2dd9510e44fafdff3452cb0d59d042c942b2945581e6ad344c48e731
3
+ size 2586705312
model.safetensors.index.json ADDED
The diff for this file is too large to render. See raw diff
 
trainer_state.json ADDED
The diff for this file is too large to render. See raw diff