dacorvo's picture
dacorvo HF staff
Synchronizing local compiler cache.
9571a70 verified
raw
history blame
1.1 kB
{"architectures": ["CvtModel"], "attention_drop_rate": [0.0, 0.0, 0.0], "cls_token": [false, false, true], "depth": [1, 2, 10], "drop_path_rate": [0.0, 0.0, 0.1], "drop_rate": [0.0, 0.0, 0.0], "embed_dim": [16, 48, 96], "image_size": 64, "initializer_range": 0.02, "kernel_qkv": [3, 3, 3], "layer_norm_eps": 1e-12, "mlp_ratio": [4.0, 4.0, 4.0], "model_type": "cvt", "neuron": {"auto_cast": null, "auto_cast_type": null, "compiler_type": "neuronx-cc", "compiler_version": "2.15.128.0+56dc5a86", "disable_fallback": false, "disable_fast_relayout": false, "dynamic_batch_size": true, "inline_weights_to_neff": true, "optlevel": "2", "output_attentions": false, "output_hidden_states": false, "static_batch_size": 1, "static_image_size": 64, "static_num_channels": 3}, "num_channels": 3, "num_heads": [1, 3, 6], "padding_kv": [1, 1, 1], "padding_q": [1, 1, 1], "patch_padding": [2, 1, 1], "patch_sizes": [7, 3, 3], "patch_stride": [4, 2, 2], "qkv_bias": [true, true, true], "qkv_projection_method": ["dw_bn", "dw_bn", "dw_bn"], "stride_kv": [2, 2, 2], "stride_q": [1, 1, 1], "task": "image-classification"}