|
{ |
|
"base_model_name_or_path": "meta-llama/Llama-3.2-1B-Instruct", |
|
"compression": { |
|
"disabled_ids": [ |
|
128000, |
|
128001, |
|
128002, |
|
128003, |
|
128004, |
|
128005, |
|
128006, |
|
128007, |
|
128008, |
|
128009, |
|
128010, |
|
128011, |
|
128012, |
|
128013, |
|
128014, |
|
128015, |
|
128016, |
|
128017, |
|
128018, |
|
128019, |
|
128020, |
|
128021, |
|
128022, |
|
128023, |
|
128024, |
|
128025, |
|
128026, |
|
128027, |
|
128028, |
|
128029, |
|
128030, |
|
128031, |
|
128032, |
|
128033, |
|
128034, |
|
128035, |
|
128036, |
|
128037, |
|
128038, |
|
128039, |
|
128040, |
|
128041, |
|
128042, |
|
128043, |
|
128044, |
|
128045, |
|
128046, |
|
128047, |
|
128048, |
|
128049, |
|
128050, |
|
128051, |
|
128052, |
|
128053, |
|
128054, |
|
128055, |
|
128056, |
|
128057, |
|
128058, |
|
128059, |
|
128060, |
|
128061, |
|
128062, |
|
128063, |
|
128064, |
|
128065, |
|
128066, |
|
128067, |
|
128068, |
|
128069, |
|
128070, |
|
128071, |
|
128072, |
|
128073, |
|
128074, |
|
128075, |
|
128076, |
|
128077, |
|
128078, |
|
128079, |
|
128080, |
|
128081, |
|
128082, |
|
128083, |
|
128084, |
|
128085, |
|
128086, |
|
128087, |
|
128088, |
|
128089, |
|
128090, |
|
128091, |
|
128092, |
|
128093, |
|
128094, |
|
128095, |
|
128096, |
|
128097, |
|
128098, |
|
128099, |
|
128100, |
|
128101, |
|
128102, |
|
128103, |
|
128104, |
|
128105, |
|
128106, |
|
128107, |
|
128108, |
|
128109, |
|
128110, |
|
128111, |
|
128112, |
|
128113, |
|
128114, |
|
128115, |
|
128116, |
|
128117, |
|
128118, |
|
128119, |
|
128120, |
|
128121, |
|
128122, |
|
128123, |
|
128124, |
|
128125, |
|
128126, |
|
128127, |
|
128128, |
|
128129, |
|
128130, |
|
128131, |
|
128132, |
|
128133, |
|
128134, |
|
128135, |
|
128136, |
|
128137, |
|
128138, |
|
128139, |
|
128140, |
|
128141, |
|
128142, |
|
128143, |
|
128144, |
|
128145, |
|
128146, |
|
128147, |
|
128148, |
|
128149, |
|
128150, |
|
128151, |
|
128152, |
|
128153, |
|
128154, |
|
128155, |
|
128156, |
|
128157, |
|
128158, |
|
128159, |
|
128160, |
|
128161, |
|
128162, |
|
128163, |
|
128164, |
|
128165, |
|
128166, |
|
128167, |
|
128168, |
|
128169, |
|
128170, |
|
128171, |
|
128172, |
|
128173, |
|
128174, |
|
128175, |
|
128176, |
|
128177, |
|
128178, |
|
128179, |
|
128180, |
|
128181, |
|
128182, |
|
128183, |
|
128184, |
|
128185, |
|
128186, |
|
128187, |
|
128188, |
|
128189, |
|
128190, |
|
128191, |
|
128192, |
|
128193, |
|
128194, |
|
128195, |
|
128196, |
|
128197, |
|
128198, |
|
128199, |
|
128200, |
|
128201, |
|
128202, |
|
128203, |
|
128204, |
|
128205, |
|
128206, |
|
128207, |
|
128208, |
|
128209, |
|
128210, |
|
128211, |
|
128212, |
|
128213, |
|
128214, |
|
128215, |
|
128216, |
|
128217, |
|
128218, |
|
128219, |
|
128220, |
|
128221, |
|
128222, |
|
128223, |
|
128224, |
|
128225, |
|
128226, |
|
128227, |
|
128228, |
|
128229, |
|
128230, |
|
128231, |
|
128232, |
|
128233, |
|
128234, |
|
128235, |
|
128236, |
|
128237, |
|
128238, |
|
128239, |
|
128240, |
|
128241, |
|
128242, |
|
128243, |
|
128244, |
|
128245, |
|
128246, |
|
128247, |
|
128248, |
|
128249, |
|
128250, |
|
128251, |
|
128252, |
|
128253, |
|
128254, |
|
128255 |
|
], |
|
"initial_vocab_size": 128256, |
|
"max_codebook_size": 2048, |
|
"max_subtokens": 4 |
|
}, |
|
"encoder": { |
|
"hidden_size": 2048, |
|
"intermediate_size": null, |
|
"num_heads": 32, |
|
"num_hidden_layers": 2, |
|
"position_encoding": "learnable", |
|
"tie_encoders": true |
|
}, |
|
"encoder_type": "transformer" |
|
} |