TimeRobber committed on
Commit
79e2321
·
1 Parent(s): 1e33f3e

Upload part 46

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +47 -0
  2. checkpoint_1007000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray +1 -0
  3. checkpoint_1007000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 +0 -0
  4. checkpoint_1007000/state.param_states.encoder.layers_23.pre_attention_layer_norm.scale.v/.zarray +1 -0
  5. checkpoint_1007000/state.param_states.encoder.layers_23.pre_attention_layer_norm.scale.v/0 +0 -0
  6. checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray +1 -0
  7. checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp10130132370000382642.~1663960299882054~ +1 -0
  8. checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp10954122248698558262.~1663960300073222~ +1 -0
  9. checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp11709688572954520360.~1663960299677964~ +1 -0
  10. checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp14956069949774084406.~1663960300075491~ +1 -0
  11. checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp4025274537859120413.~1663960300017995~ +1 -0
  12. checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.0 +3 -0
  13. checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.1 +3 -0
  14. checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.2 +3 -0
  15. checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.3 +3 -0
  16. checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.4 +3 -0
  17. checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.5 +3 -0
  18. checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.6 +3 -0
  19. checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.7 +3 -0
  20. checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp12479244418913466456.~1663960300685403~ +1 -0
  21. checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp5189599943241222398.~1663960300885553~ +1 -0
  22. checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp9533798046376307163.~1663960300551871~ +1 -0
  23. checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp9666493176089962186.~1663960300686970~ +1 -0
  24. checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray +1 -0
  25. checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp10278330172052962831.~1663960300424944~ +1 -0
  26. checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp11926956483067476319.~1663960300385701~ +1 -0
  27. checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp15791834445691843274.~1663960300724828~ +1 -0
  28. checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp1714517278612008761.~1663960300466758~ +1 -0
  29. checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp18021455530413911774.~1663960300776722~ +1 -0
  30. checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp4364215189749523097.~1663960300420323~ +1 -0
  31. checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp5709416680492409645.~1663960300551197~ +1 -0
  32. checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.0 +3 -0
  33. checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.1 +3 -0
  34. checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.2 +3 -0
  35. checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.3 +3 -0
  36. checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.4 +3 -0
  37. checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.5 +3 -0
  38. checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.6 +3 -0
  39. checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.7 +3 -0
  40. checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray +1 -0
  41. checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp10398387860063871791.~1663960300385660~ +1 -0
  42. checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp10700189453700589260.~1663960300778874~ +1 -0
  43. checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp14196631297793674538.~1663960300685115~ +1 -0
  44. checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp17083914858304621802.~1663960300989814~ +1 -0
  45. checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp6968194478073802803.~1663960300548716~ +1 -0
  46. checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp9240234483793240192.~1663960300610878~ +1 -0
  47. checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.0 +3 -0
  48. checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.1 +3 -0
  49. checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.2 +3 -0
  50. checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.3 +3 -0
.gitattributes CHANGED
@@ -2339,3 +2339,50 @@ checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/7.0 filter=lfs diff=lf
2339
  checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
2340
  checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
2341
  checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2339
  checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/5.0 filter=lfs diff=lfs merge=lfs -text
2340
  checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/2.0 filter=lfs diff=lfs merge=lfs -text
2341
  checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/4.0 filter=lfs diff=lfs merge=lfs -text
2342
+ checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2343
+ checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2344
+ checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2345
+ checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2346
+ checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2347
+ checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2348
+ checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2349
+ checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2350
+ checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2351
+ checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2352
+ checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2353
+ checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2354
+ checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2355
+ checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2356
+ checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2357
+ checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2358
+ checkpoint_1007000/target.encoder.layers_2.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2359
+ checkpoint_1007000/target.encoder.layers_2.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2360
+ checkpoint_1007000/target.encoder.layers_2.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2361
+ checkpoint_1007000/target.encoder.layers_2.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2362
+ checkpoint_1007000/target.encoder.layers_2.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2363
+ checkpoint_1007000/target.encoder.layers_2.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2364
+ checkpoint_1007000/target.encoder.layers_2.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2365
+ checkpoint_1007000/target.encoder.layers_2.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2366
+ checkpoint_1007000/target.encoder.layers_23.attention.value.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2367
+ checkpoint_1007000/target.encoder.layers_23.attention.value.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2368
+ checkpoint_1007000/target.encoder.layers_23.attention.value.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2369
+ checkpoint_1007000/target.encoder.layers_23.attention.value.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2370
+ checkpoint_1007000/target.encoder.layers_23.attention.value.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2371
+ checkpoint_1007000/target.encoder.layers_23.attention.value.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2372
+ checkpoint_1007000/target.encoder.layers_23.attention.value.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2373
+ checkpoint_1007000/target.encoder.layers_23.attention.value.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2374
+ checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2375
+ checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2376
+ checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2377
+ checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2378
+ checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2379
+ checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2380
+ checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
2381
+ checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.4 filter=lfs diff=lfs merge=lfs -text
2382
+ checkpoint_1007000/target.encoder.layers_15.attention.query.kernel/0.1 filter=lfs diff=lfs merge=lfs -text
2383
+ checkpoint_1007000/target.encoder.layers_15.attention.query.kernel/0.7 filter=lfs diff=lfs merge=lfs -text
2384
+ checkpoint_1007000/target.encoder.layers_15.attention.query.kernel/0.0 filter=lfs diff=lfs merge=lfs -text
2385
+ checkpoint_1007000/target.encoder.layers_15.attention.query.kernel/0.6 filter=lfs diff=lfs merge=lfs -text
2386
+ checkpoint_1007000/target.encoder.layers_15.attention.query.kernel/0.5 filter=lfs diff=lfs merge=lfs -text
2387
+ checkpoint_1007000/target.encoder.layers_15.attention.query.kernel/0.3 filter=lfs diff=lfs merge=lfs -text
2388
+ checkpoint_1007000/target.encoder.layers_15.attention.query.kernel/0.2 filter=lfs diff=lfs merge=lfs -text
checkpoint_1007000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.decoder.layers_3.pre_self_attention_layer_norm.scale.v/0 ADDED
Binary file (15 kB). View file
 
checkpoint_1007000/state.param_states.encoder.layers_23.pre_attention_layer_norm.scale.v/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096],"zarr_format":2}
checkpoint_1007000/state.param_states.encoder.layers_23.pre_attention_layer_norm.scale.v/0 ADDED
Binary file (14.8 kB). View file
 
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp10130132370000382642.~1663960299882054~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp10954122248698558262.~1663960300073222~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp11709688572954520360.~1663960299677964~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp14956069949774084406.~1663960300075491~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/.zarray.__tmp4025274537859120413.~1663960300017995~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a83c26214e409481a714f084ece9e067cca4762d0af8aadbe5857ba13d8b0489
3
+ size 7815472
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1c317d3ca1e1771c8d5960d333239c9edcd635ef9b51a2f61d25fcec1099851
3
+ size 7829309
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21150fdd44d99220013d321faf65228101d41a5df30771c6fde236cf3bc81ad2
3
+ size 7815100
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bab84779b4c131b08620c70171a4a93e3bfb15a0f9f0904557461dcb131670e7
3
+ size 7812569
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c3770ae12dfce408e692544c4a112b3913e1403433b9a818f362a30046cb11a
3
+ size 7822649
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d31f30e22520bd72134897be7def712846310aaf0435ebecf107a655664ffb5
3
+ size 7811908
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d1edf0f281f471f95e9d7c03b83831113eae2dd0f9dd1db13f95097f0ccab88
3
+ size 7819892
checkpoint_1007000/target.decoder.layers_10.self_attention.key.kernel/0.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcac29c17010bb3cc600bb4c44199ff64454ff377a739c1ae328875e15b0a042
3
+ size 7818316
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp12479244418913466456.~1663960300685403~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp5189599943241222398.~1663960300885553~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp9533798046376307163.~1663960300551871~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_14.mlp.wo.kernel/.zarray.__tmp9666493176089962186.~1663960300686970~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[1280,4096],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[10240,4096],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp10278330172052962831.~1663960300424944~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp11926956483067476319.~1663960300385701~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp15791834445691843274.~1663960300724828~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp1714517278612008761.~1663960300466758~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp18021455530413911774.~1663960300776722~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp4364215189749523097.~1663960300420323~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/.zarray.__tmp5709416680492409645.~1663960300551197~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,1280],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,10240],"zarr_format":2}
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4634fa7bc859ab93145358e930f516b1af4d41af952c998beb0a5c19147ab2a8
3
+ size 19555434
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:288bec55b995218320f7376ac4ed1eaf3ddb0811a2cdf2af1ca4447d1ec3c4f2
3
+ size 19558146
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d74fa8efe1dadeea42b3622f085a18c86a92af50a676d25b6e7f46b1953947d6
3
+ size 19557656
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f55a8f784287b7fa506a4f2cc8129dbdb4458afb1886400f39c3e6f6f9e2c47a
3
+ size 19554736
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9af2dc6e88c0b52d3b2778c8da695120b4f4af775d75509a76d1c744ec670850
3
+ size 19559210
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13f1571ec30c10983b517f469a67a0205478e823c23cc65ddfa6a99ef136add0
3
+ size 19554503
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bed2a1d4defc5b51618e20425c92f0a80ece226cca3a30953b53574b7fbe590
3
+ size 19558320
checkpoint_1007000/target.decoder.layers_2.mlp.wi_0.kernel/0.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f9aa132b4adfb8e7d663f0897aa41c39ce0c64fa30c8fd078db837654248c08
3
+ size 19556316
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp10398387860063871791.~1663960300385660~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp10700189453700589260.~1663960300778874~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp14196631297793674538.~1663960300685115~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp17083914858304621802.~1663960300989814~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp6968194478073802803.~1663960300548716~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/.zarray.__tmp9240234483793240192.~1663960300610878~ ADDED
@@ -0,0 +1 @@
 
 
1
+ {"chunks":[4096,512],"compressor":{"id":"gzip","level":1},"dimension_separator":".","dtype":"<f4","fill_value":null,"filters":null,"order":"C","shape":[4096,4096],"zarr_format":2}
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bac07b58214c98ef696ca8fcfb2bea453d2da5fafe98a4356c6817e7062d7bf
3
+ size 7807422
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7753b3cce5efb8ce609ce0728fb7ace2da8186da69b338d25dcb9fc80dd05b6a
3
+ size 7810124
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59bccb8735f098b3d33ecb29e500e8860d1b897e6ecac939b30cd116c8c4e7fb
3
+ size 7807194
checkpoint_1007000/target.encoder.layers_13.attention.query.kernel/0.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9afa991b4eb47d4f2312701000efa22643791e5045668990a9bca467331f15e
3
+ size 7810691