numen-tech committed on
Commit
79796f7
·
1 Parent(s): ce8a752

A minor improvement in the model's memory usage

Browse files
Files changed (2) hide show
  1. ndarray-cache.json +6 -6
  2. params_shard_98.bin +2 -2
ndarray-cache.json CHANGED
@@ -4150,7 +4150,7 @@
4150
  {
4151
  "dataPath": "params_shard_98.bin",
4152
  "format": "raw-shard",
4153
- "nbytes": 9926144,
4154
  "records": [
4155
  {
4156
  "name": "param_319",
@@ -4207,24 +4207,24 @@
4207
  {
4208
  "name": "param_325",
4209
  "shape": [
4210
- 2048,
4211
  128
4212
  ],
4213
  "dtype": "float16",
4214
  "format": "raw",
4215
- "nbytes": 524288,
4216
  "byteOffset": 8877568
4217
  },
4218
  {
4219
  "name": "param_326",
4220
  "shape": [
4221
- 2048,
4222
  128
4223
  ],
4224
  "dtype": "float16",
4225
  "format": "raw",
4226
- "nbytes": 524288,
4227
- "byteOffset": 9401856
4228
  }
4229
  ]
4230
  }
 
4150
  {
4151
  "dataPath": "params_shard_98.bin",
4152
  "format": "raw-shard",
4153
+ "nbytes": 9270784,
4154
  "records": [
4155
  {
4156
  "name": "param_319",
 
4207
  {
4208
  "name": "param_325",
4209
  "shape": [
4210
+ 768,
4211
  128
4212
  ],
4213
  "dtype": "float16",
4214
  "format": "raw",
4215
+ "nbytes": 196608,
4216
  "byteOffset": 8877568
4217
  },
4218
  {
4219
  "name": "param_326",
4220
  "shape": [
4221
+ 768,
4222
  128
4223
  ],
4224
  "dtype": "float16",
4225
  "format": "raw",
4226
+ "nbytes": 196608,
4227
+ "byteOffset": 9074176
4228
  }
4229
  ]
4230
  }
params_shard_98.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eece05d53cb4e2e5b3e5fa96338da001b8152d27ae9948d1f88d33afcd204a07
3
- size 9926144
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf62fc9cc27097dc9d9ee842625f8b202e6a9e492c3def96db399c06e457d55d
3
+ size 9270784