danielhanchen committed on
Commit
1eee0c0
·
verified ·
1 Parent(s): 4bbec0b

Upload folder using huggingface_hub

Browse files
config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "_name_or_path": "unsloth/gemma-7b",
3
  "architectures": [
4
  "GemmaForCausalLM"
5
  ],
@@ -28,7 +27,12 @@
28
  "bnb_4bit_use_double_quant": true,
29
  "llm_int8_enable_fp32_cpu_offload": false,
30
  "llm_int8_has_fp16_weight": false,
31
- "llm_int8_skip_modules": null,
 
 
 
 
 
32
  "llm_int8_threshold": 6.0,
33
  "load_in_4bit": true,
34
  "load_in_8bit": false,
@@ -38,7 +42,8 @@
38
  "rope_scaling": null,
39
  "rope_theta": 10000.0,
40
  "torch_dtype": "bfloat16",
41
- "transformers_version": "4.44.2",
 
42
  "unsloth_version": "2024.9",
43
  "use_cache": true,
44
  "vocab_size": 256000
 
1
  {
 
2
  "architectures": [
3
  "GemmaForCausalLM"
4
  ],
 
27
  "bnb_4bit_use_double_quant": true,
28
  "llm_int8_enable_fp32_cpu_offload": false,
29
  "llm_int8_has_fp16_weight": false,
30
+ "llm_int8_skip_modules": [
31
+ "lm_head",
32
+ "multi_modal_projector",
33
+ "merger",
34
+ "modality_projection"
35
+ ],
36
  "llm_int8_threshold": 6.0,
37
  "load_in_4bit": true,
38
  "load_in_8bit": false,
 
42
  "rope_scaling": null,
43
  "rope_theta": 10000.0,
44
  "torch_dtype": "bfloat16",
45
+ "transformers_version": "4.52.4",
46
+ "unsloth_fixed": true,
47
  "unsloth_version": "2024.9",
48
  "use_cache": true,
49
  "vocab_size": 256000
generation_config.json CHANGED
@@ -4,5 +4,5 @@
4
  "eos_token_id": 1,
5
  "max_length": 8192,
6
  "pad_token_id": 0,
7
- "transformers_version": "4.44.2"
8
  }
 
4
  "eos_token_id": 1,
5
  "max_length": 8192,
6
  "pad_token_id": 0,
7
+ "transformers_version": "4.52.4"
8
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:873911a10106ce1a6f3350b161fcaf4ffca2626e0ed589ca6d42ebf376413eac
3
- size 5572148372
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6af91e32a2f16180845a63d436c9dc9daea8aa9d5d0641525b231a9b5a47fd8c
3
+ size 5572148568
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7da53ca29fb16f6b2489482fc0bc6a394162cdab14d12764a1755ebc583fea79
3
- size 17518525
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f559f2189f392b4555613965f089e7c4d300b41fbe080bf79da0d676e33ee7f0
3
+ size 34356041
tokenizer_config.json CHANGED
@@ -1115,7 +1115,7 @@
1115
  "special": false
1116
  },
1117
  "139": {
1118
- "content": "▁▁",
1119
  "lstrip": false,
1120
  "normalized": false,
1121
  "rstrip": false,
@@ -1123,7 +1123,7 @@
1123
  "special": false
1124
  },
1125
  "140": {
1126
- "content": "▁▁▁",
1127
  "lstrip": false,
1128
  "normalized": false,
1129
  "rstrip": false,
@@ -1131,7 +1131,7 @@
1131
  "special": false
1132
  },
1133
  "141": {
1134
- "content": "▁▁▁▁",
1135
  "lstrip": false,
1136
  "normalized": false,
1137
  "rstrip": false,
@@ -1139,7 +1139,7 @@
1139
  "special": false
1140
  },
1141
  "142": {
1142
- "content": "▁▁▁▁▁",
1143
  "lstrip": false,
1144
  "normalized": false,
1145
  "rstrip": false,
@@ -1147,7 +1147,7 @@
1147
  "special": false
1148
  },
1149
  "143": {
1150
- "content": "▁▁▁▁▁▁",
1151
  "lstrip": false,
1152
  "normalized": false,
1153
  "rstrip": false,
@@ -1155,7 +1155,7 @@
1155
  "special": false
1156
  },
1157
  "144": {
1158
- "content": "▁▁▁▁▁▁▁",
1159
  "lstrip": false,
1160
  "normalized": false,
1161
  "rstrip": false,
@@ -1163,7 +1163,7 @@
1163
  "special": false
1164
  },
1165
  "145": {
1166
- "content": "▁▁▁▁▁▁▁▁",
1167
  "lstrip": false,
1168
  "normalized": false,
1169
  "rstrip": false,
@@ -1171,7 +1171,7 @@
1171
  "special": false
1172
  },
1173
  "146": {
1174
- "content": "▁▁▁▁▁▁▁▁▁",
1175
  "lstrip": false,
1176
  "normalized": false,
1177
  "rstrip": false,
@@ -1179,7 +1179,7 @@
1179
  "special": false
1180
  },
1181
  "147": {
1182
- "content": "▁▁▁▁▁▁▁▁▁▁",
1183
  "lstrip": false,
1184
  "normalized": false,
1185
  "rstrip": false,
@@ -1187,7 +1187,7 @@
1187
  "special": false
1188
  },
1189
  "148": {
1190
- "content": "▁▁▁▁▁▁▁▁▁▁▁",
1191
  "lstrip": false,
1192
  "normalized": false,
1193
  "rstrip": false,
@@ -1195,7 +1195,7 @@
1195
  "special": false
1196
  },
1197
  "149": {
1198
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁",
1199
  "lstrip": false,
1200
  "normalized": false,
1201
  "rstrip": false,
@@ -1203,7 +1203,7 @@
1203
  "special": false
1204
  },
1205
  "150": {
1206
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁",
1207
  "lstrip": false,
1208
  "normalized": false,
1209
  "rstrip": false,
@@ -1211,7 +1211,7 @@
1211
  "special": false
1212
  },
1213
  "151": {
1214
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1215
  "lstrip": false,
1216
  "normalized": false,
1217
  "rstrip": false,
@@ -1219,7 +1219,7 @@
1219
  "special": false
1220
  },
1221
  "152": {
1222
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1223
  "lstrip": false,
1224
  "normalized": false,
1225
  "rstrip": false,
@@ -1227,7 +1227,7 @@
1227
  "special": false
1228
  },
1229
  "153": {
1230
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1231
  "lstrip": false,
1232
  "normalized": false,
1233
  "rstrip": false,
@@ -1235,7 +1235,7 @@
1235
  "special": false
1236
  },
1237
  "154": {
1238
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1239
  "lstrip": false,
1240
  "normalized": false,
1241
  "rstrip": false,
@@ -1243,7 +1243,7 @@
1243
  "special": false
1244
  },
1245
  "155": {
1246
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1247
  "lstrip": false,
1248
  "normalized": false,
1249
  "rstrip": false,
@@ -1251,7 +1251,7 @@
1251
  "special": false
1252
  },
1253
  "156": {
1254
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1255
  "lstrip": false,
1256
  "normalized": false,
1257
  "rstrip": false,
@@ -1259,7 +1259,7 @@
1259
  "special": false
1260
  },
1261
  "157": {
1262
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1263
  "lstrip": false,
1264
  "normalized": false,
1265
  "rstrip": false,
@@ -1267,7 +1267,7 @@
1267
  "special": false
1268
  },
1269
  "158": {
1270
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1271
  "lstrip": false,
1272
  "normalized": false,
1273
  "rstrip": false,
@@ -1275,7 +1275,7 @@
1275
  "special": false
1276
  },
1277
  "159": {
1278
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1279
  "lstrip": false,
1280
  "normalized": false,
1281
  "rstrip": false,
@@ -1283,7 +1283,7 @@
1283
  "special": false
1284
  },
1285
  "160": {
1286
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1287
  "lstrip": false,
1288
  "normalized": false,
1289
  "rstrip": false,
@@ -1291,7 +1291,7 @@
1291
  "special": false
1292
  },
1293
  "161": {
1294
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1295
  "lstrip": false,
1296
  "normalized": false,
1297
  "rstrip": false,
@@ -1299,7 +1299,7 @@
1299
  "special": false
1300
  },
1301
  "162": {
1302
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1303
  "lstrip": false,
1304
  "normalized": false,
1305
  "rstrip": false,
@@ -1307,7 +1307,7 @@
1307
  "special": false
1308
  },
1309
  "163": {
1310
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1311
  "lstrip": false,
1312
  "normalized": false,
1313
  "rstrip": false,
@@ -1315,7 +1315,7 @@
1315
  "special": false
1316
  },
1317
  "164": {
1318
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1319
  "lstrip": false,
1320
  "normalized": false,
1321
  "rstrip": false,
@@ -1323,7 +1323,7 @@
1323
  "special": false
1324
  },
1325
  "165": {
1326
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1327
  "lstrip": false,
1328
  "normalized": false,
1329
  "rstrip": false,
@@ -1331,7 +1331,7 @@
1331
  "special": false
1332
  },
1333
  "166": {
1334
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1335
  "lstrip": false,
1336
  "normalized": false,
1337
  "rstrip": false,
@@ -1339,7 +1339,7 @@
1339
  "special": false
1340
  },
1341
  "167": {
1342
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1343
  "lstrip": false,
1344
  "normalized": false,
1345
  "rstrip": false,
@@ -1347,7 +1347,7 @@
1347
  "special": false
1348
  },
1349
  "168": {
1350
- "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1351
  "lstrip": false,
1352
  "normalized": false,
1353
  "rstrip": false,
@@ -1746,7 +1746,8 @@
1746
  "bos_token": "<bos>",
1747
  "clean_up_tokenization_spaces": false,
1748
  "eos_token": "<eos>",
1749
- "model_max_length": 1000000000000000019884624838656,
 
1750
  "pad_token": "<pad>",
1751
  "padding_side": "left",
1752
  "sp_model_kwargs": {},
@@ -1754,4 +1755,4 @@
1754
  "tokenizer_class": "GemmaTokenizer",
1755
  "unk_token": "<unk>",
1756
  "use_default_system_prompt": false
1757
- }
 
1115
  "special": false
1116
  },
1117
  "139": {
1118
+ "content": "\u2581\u2581",
1119
  "lstrip": false,
1120
  "normalized": false,
1121
  "rstrip": false,
 
1123
  "special": false
1124
  },
1125
  "140": {
1126
+ "content": "\u2581\u2581\u2581",
1127
  "lstrip": false,
1128
  "normalized": false,
1129
  "rstrip": false,
 
1131
  "special": false
1132
  },
1133
  "141": {
1134
+ "content": "\u2581\u2581\u2581\u2581",
1135
  "lstrip": false,
1136
  "normalized": false,
1137
  "rstrip": false,
 
1139
  "special": false
1140
  },
1141
  "142": {
1142
+ "content": "\u2581\u2581\u2581\u2581\u2581",
1143
  "lstrip": false,
1144
  "normalized": false,
1145
  "rstrip": false,
 
1147
  "special": false
1148
  },
1149
  "143": {
1150
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581",
1151
  "lstrip": false,
1152
  "normalized": false,
1153
  "rstrip": false,
 
1155
  "special": false
1156
  },
1157
  "144": {
1158
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1159
  "lstrip": false,
1160
  "normalized": false,
1161
  "rstrip": false,
 
1163
  "special": false
1164
  },
1165
  "145": {
1166
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1167
  "lstrip": false,
1168
  "normalized": false,
1169
  "rstrip": false,
 
1171
  "special": false
1172
  },
1173
  "146": {
1174
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1175
  "lstrip": false,
1176
  "normalized": false,
1177
  "rstrip": false,
 
1179
  "special": false
1180
  },
1181
  "147": {
1182
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1183
  "lstrip": false,
1184
  "normalized": false,
1185
  "rstrip": false,
 
1187
  "special": false
1188
  },
1189
  "148": {
1190
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1191
  "lstrip": false,
1192
  "normalized": false,
1193
  "rstrip": false,
 
1195
  "special": false
1196
  },
1197
  "149": {
1198
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1199
  "lstrip": false,
1200
  "normalized": false,
1201
  "rstrip": false,
 
1203
  "special": false
1204
  },
1205
  "150": {
1206
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1207
  "lstrip": false,
1208
  "normalized": false,
1209
  "rstrip": false,
 
1211
  "special": false
1212
  },
1213
  "151": {
1214
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1215
  "lstrip": false,
1216
  "normalized": false,
1217
  "rstrip": false,
 
1219
  "special": false
1220
  },
1221
  "152": {
1222
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1223
  "lstrip": false,
1224
  "normalized": false,
1225
  "rstrip": false,
 
1227
  "special": false
1228
  },
1229
  "153": {
1230
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1231
  "lstrip": false,
1232
  "normalized": false,
1233
  "rstrip": false,
 
1235
  "special": false
1236
  },
1237
  "154": {
1238
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1239
  "lstrip": false,
1240
  "normalized": false,
1241
  "rstrip": false,
 
1243
  "special": false
1244
  },
1245
  "155": {
1246
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1247
  "lstrip": false,
1248
  "normalized": false,
1249
  "rstrip": false,
 
1251
  "special": false
1252
  },
1253
  "156": {
1254
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1255
  "lstrip": false,
1256
  "normalized": false,
1257
  "rstrip": false,
 
1259
  "special": false
1260
  },
1261
  "157": {
1262
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1263
  "lstrip": false,
1264
  "normalized": false,
1265
  "rstrip": false,
 
1267
  "special": false
1268
  },
1269
  "158": {
1270
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1271
  "lstrip": false,
1272
  "normalized": false,
1273
  "rstrip": false,
 
1275
  "special": false
1276
  },
1277
  "159": {
1278
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1279
  "lstrip": false,
1280
  "normalized": false,
1281
  "rstrip": false,
 
1283
  "special": false
1284
  },
1285
  "160": {
1286
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1287
  "lstrip": false,
1288
  "normalized": false,
1289
  "rstrip": false,
 
1291
  "special": false
1292
  },
1293
  "161": {
1294
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1295
  "lstrip": false,
1296
  "normalized": false,
1297
  "rstrip": false,
 
1299
  "special": false
1300
  },
1301
  "162": {
1302
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1303
  "lstrip": false,
1304
  "normalized": false,
1305
  "rstrip": false,
 
1307
  "special": false
1308
  },
1309
  "163": {
1310
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1311
  "lstrip": false,
1312
  "normalized": false,
1313
  "rstrip": false,
 
1315
  "special": false
1316
  },
1317
  "164": {
1318
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1319
  "lstrip": false,
1320
  "normalized": false,
1321
  "rstrip": false,
 
1323
  "special": false
1324
  },
1325
  "165": {
1326
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1327
  "lstrip": false,
1328
  "normalized": false,
1329
  "rstrip": false,
 
1331
  "special": false
1332
  },
1333
  "166": {
1334
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1335
  "lstrip": false,
1336
  "normalized": false,
1337
  "rstrip": false,
 
1339
  "special": false
1340
  },
1341
  "167": {
1342
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1343
  "lstrip": false,
1344
  "normalized": false,
1345
  "rstrip": false,
 
1347
  "special": false
1348
  },
1349
  "168": {
1350
+ "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1351
  "lstrip": false,
1352
  "normalized": false,
1353
  "rstrip": false,
 
1746
  "bos_token": "<bos>",
1747
  "clean_up_tokenization_spaces": false,
1748
  "eos_token": "<eos>",
1749
+ "extra_special_tokens": {},
1750
+ "model_max_length": 8192,
1751
  "pad_token": "<pad>",
1752
  "padding_side": "left",
1753
  "sp_model_kwargs": {},
 
1755
  "tokenizer_class": "GemmaTokenizer",
1756
  "unk_token": "<unk>",
1757
  "use_default_system_prompt": false
1758
+ }