Synchronizing local compiler cache.
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +344 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev0/qwen2/Qwen/Qwen2.5-0.5B/5eef7da50a217db5b302.json +97 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev0/qwen2/yujiepan/qwen2.5-128k-tiny-random/3292185f0123466a93a2.json +79 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev0/qwen2/yujiepan/qwen2.5-128k-tiny-random/b60dca7d7a9c53810fe0.json +79 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev0/qwen2/yujiepan/qwen2.5-128k-tiny-random/b9b0c081795fa9e33ca6.json +79 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/082c855afd5bbe38fea8.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/19ebb6a6a5ec909e86f1.json +55 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/1e1cab9afee16970464a.json +55 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/2420b2b633bc1e938403.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/3585a8b7eec15ef74cc9.json +55 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/4d038e1c09d623b63731.json +55 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/59c92a651b8b40190b9d.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/707d5fc3c98b3c204500.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/8829976eff976b676195.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/903f2ac3444c8203b948.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/9b69ad26e6071c069631.json +55 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/aa7706c37f42f9b0efa0.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/b5b638607d26526724c7.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/ce96b3b9bef1f6cf0d93.json +55 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/cf3a4b3035690a565ab1.json +55 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/d2da3177c42e88297899.json +55 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/e59dd1535caa6a29b4cc.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/beit/hf-internal-testing/tiny-random-BeitForImageClassification/7b8399664c54026a03ff.json +90 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/beit/hf-internal-testing/tiny-random-BeitForImageClassification/8eea34f80bdd528f4c47.json +90 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/Jingya/tiny-random-bert-remote-code/601076bf2990d898404b.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/fxmarty/tiny-bert-sst2-distilled-subfolder/d7d576d06e1491d72e5a.json +61 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/07d9dac237105afed7b4.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/0d7dca7e1b02d11fa30b.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/22ce2cce0b08d134021c.json +53 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/28bcefedc9caadd676ab.json +53 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/3908bf519c210b434176.json +53 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/5ead9d705b13f37e716b.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/80c925bab2fcc5749b91.json +53 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/92f51980d46489605055.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/aeebf3f56cf9d0ed0250.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/cfb94bae5629e275593f.json +53 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e050716b5de372871d73.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e0768f223c51e12fd868.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e2594a1f187f452902f7.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e4834fd951418b796374.json +53 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e7e71e6beffbf701391b.json +53 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/ea81a963f6aa67da9f09.json +53 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/ef32dca934503ba9400c.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/f15944a91bf873bc4059.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/sentence-transformers/all-MiniLM-L6-v2/b571d0d9ac9ad084fa8c.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/sentence-transformers/all-MiniLM-L6-v2/f99a0822ae493faf0bb5.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/camembert/hf-internal-testing/tiny-random-camembert/16650c04744503a0af47.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/camembert/hf-internal-testing/tiny-random-camembert/3d5fe21de242b8b602d5.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/camembert/hf-internal-testing/tiny-random-camembert/4b4a4fbbe9d668bcf61e.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/camembert/hf-internal-testing/tiny-random-camembert/5bca725791b646775427.json +53 -0
.gitattributes
CHANGED
@@ -10270,3 +10270,347 @@ neuronxcc-2.20.9961.0+0acef03a/MODULE_057bc784fc164fb34d3e+ed72d204/model.neff f
|
|
10270 |
neuronxcc-2.20.9961.0+0acef03a/MODULE_de733c6f96020a1e5f56+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text
|
10271 |
neuronxcc-2.20.9961.0+0acef03a/MODULE_de733c6f96020a1e5f56+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
10272 |
neuronxcc-2.20.9961.0+0acef03a/MODULE_e3031c3c114f7c905db7+ae6a382b/model.neff filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
10270 |
neuronxcc-2.20.9961.0+0acef03a/MODULE_de733c6f96020a1e5f56+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text
|
10271 |
neuronxcc-2.20.9961.0+0acef03a/MODULE_de733c6f96020a1e5f56+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
10272 |
neuronxcc-2.20.9961.0+0acef03a/MODULE_e3031c3c114f7c905db7+ae6a382b/model.neff filter=lfs diff=lfs merge=lfs -text
|
10273 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0219e831452f3e9b80e6/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10274 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_021be40fb5716d1066d1/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10275 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_02c51eae95f4097f74e7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10276 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_07d9dac237105afed7b4/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10277 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_082c855afd5bbe38fea8/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10278 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0994f3d43a554bcbbcd7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10279 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0ad6e67d0b4363af0472/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10280 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0af77bd813eb760ae10d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10281 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0b0b6686a4841c281f89/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10282 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0b384d0739d57659345e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10283 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0bfe6d17355fd2f0836f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10284 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0ca055684d61c552e3ec/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10285 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0ca23862a0ff1499156f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10286 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0d7dca7e1b02d11fa30b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10287 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0e02d4795b77fba80c35/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10288 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f556b899de48f28b455/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10289 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0fdfb4247e7d07ebbad0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10290 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_101f045ec3ef38dff069/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10291 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_11228616321528259762+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10292 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1179fb416e242252b8b1/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10293 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_117dcaf2b5ba5b392c51/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10294 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_11d26d78110e3ea447dd/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10295 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_12273156641748218648+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10296 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1227467f6a1477aec333/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10297 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1355027528627e06e5cb/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10298 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_136344c1e04a80fc9e83/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10299 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_14069605881026998085+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10300 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_14160024224657763603+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10301 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_14829227305888857035+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10302 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_148a07ab282c4e1a2a0e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10303 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_15025462673285903344+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10304 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_15f7e443873c3474a6aa/decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10305 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_15f7e443873c3474a6aa/encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10306 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_16650c04744503a0af47/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10307 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_16839706381867715922+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10308 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_16b01b31bf5bb1c85c1d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10309 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_17327912813737302838+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10310 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_17419856824540332941+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10311 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_17641195202625304294+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10312 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_17711110885328520544+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10313 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_17855694184933887987+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10314 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_184d9b81ae20431d278e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10315 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_18d8cc6bf53b525ebb83/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10316 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_19a9557944c3c798892c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10317 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_19ebb6a6a5ec909e86f1/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10318 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ae5dec75b26da7fc293+253d6470/model.neff filter=lfs diff=lfs merge=lfs -text
|
10319 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1be47d7ec35995ba24e2/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10320 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ccdb35db19ea6d46330/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10321 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1d4e0541af5c102c02ad/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10322 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1e1cab9afee16970464a/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10323 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1f71844521461b69a9a1/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10324 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1f71844521461b69a9a1/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10325 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1f71844521461b69a9a1/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10326 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1f71844521461b69a9a1/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10327 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1f997b4c07c5b98b2872/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10328 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2011979c1c7685c0c1e8/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10329 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_22ac4beaed8c828e276d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10330 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_22ce2cce0b08d134021c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10331 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2420b2b633bc1e938403/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10332 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2518ad68ffda816de14c+a74130ed/model.neff filter=lfs diff=lfs merge=lfs -text
|
10333 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2518ad68ffda816de14c+a74130ed/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
10334 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_27494e54568e0f4aef97/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10335 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_28bcefedc9caadd676ab/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10336 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2994655886375ea65794/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10337 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2bfc916223b281bde6c9/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10338 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2c3447cbfc1aa2c980e4/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10339 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2d941194111edd1cc349/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10340 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2ec978f7548ba514cc92/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10341 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2eeccd3fb290738b486c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10342 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_30709c9a1366cc22f381/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10343 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3091516cc256301854d5/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10344 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3164ef3b6e4540774d38/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10345 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3262637bc52e95809853+431f5505/model.neff filter=lfs diff=lfs merge=lfs -text
|
10346 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_33c68608ff1365e11b4b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10347 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_35240b83eadb946e8397/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10348 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3585a8b7eec15ef74cc9/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10349 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3666724308aaa469662b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10350 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_37fb28b99dfea65dc5fd/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10351 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_38fe3c7c7cf144065eac/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10352 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3908bf519c210b434176/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10353 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_39152d050ca1aafdbcb7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10354 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3bf2eb59f27536b63a45/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10355 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3d5fe21de242b8b602d5/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10356 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3f7a39fcaca1f42af1d6/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10357 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4067177570182b1343d2/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10358 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4148dd3c4e0957c59aec/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10359 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4375062474730619889+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10360 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_44670f0e856e93e13945/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10361 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_45c7246705c9e6fab659/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10362 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_466672b98b30e850228e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10363 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_467e3986218b1c421e16/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10364 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4696932584f9d8f704d5/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10365 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4750006367237009755+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10366 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_484d55fa9705364e6d6c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10367 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_491a208ef81533ee4361/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10368 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4974b909ef52ed6985aa/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10369 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4b4a4fbbe9d668bcf61e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10370 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4b5db21c35dab98379c0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10371 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4bf35dcb438eff118841/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10372 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4d038e1c09d623b63731/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10373 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4d2fe63b7ea76c7ef876+a74130ed/model.neff filter=lfs diff=lfs merge=lfs -text
|
10374 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4d2fe63b7ea76c7ef876+a74130ed/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
10375 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4e4ef27b3302beb416e2+253d6470/model.neff filter=lfs diff=lfs merge=lfs -text
|
10376 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_50466361a10e0beb2743/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10377 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_50881c62b5e180d29b73/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10378 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_50dd1eff58edae4890c4/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10379 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_52ac96dddc861615c14b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10380 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_530b46c2c544923d9ae4/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10381 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5321652960071550735+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10382 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_54999f3651eabb911710/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10383 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_565ec63172e78bb6a459/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10384 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_566b362576597dc93bf0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10385 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_56fb08782842e65d4478/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10386 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_56fb7ca25c9741358f35/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10387 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_57575a85181cb2c0c6ce/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10388 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_59287e3a63d75be1484e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10389 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_59c92a651b8b40190b9d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10390 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5bca725791b646775427/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10391 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5cfaeab2b13c776d07bb/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10392 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5d5dadc2c2138bf8ab44/decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10393 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5d5dadc2c2138bf8ab44/encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10394 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5dba74ecad23c5836b41/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10395 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5de28d74475c2e525475/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10396 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5e0f1f4e96fb7f38115d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10397 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5ead9d705b13f37e716b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10398 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5ee5e7496586a5b158cd/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10399 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5fb0198cf9dd4a2e93ea/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10400 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5fc297836c63bcff7ed3/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10401 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_601076bf2990d898404b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10402 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_602b46624db97cda3fee/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10403 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6081e29d0b26014e391f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10404 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_61774b9874fadd5b1723/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10405 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_61a96b508e7be967c0c7+cd3419b6/model.neff filter=lfs diff=lfs merge=lfs -text
|
10406 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_61a96b508e7be967c0c7+cd3419b6/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
10407 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_62c0826140d6564782c3/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10408 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6356dda8884e943ca1eb/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10409 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6356dda8884e943ca1eb/text_encoder_2/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10410 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6356dda8884e943ca1eb/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10411 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6356dda8884e943ca1eb/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10412 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6356dda8884e943ca1eb/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10413 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_639b34a908c080e3d3e9/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10414 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_63b1a6be8b23f66fef00/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10415 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_64383c5d9ccd5d74a246/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10416 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_64a180bec331b8ec91ba/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10417 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_655beeec84479afaaafe/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10418 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_66be3aba74892f370b62/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10419 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_68d42db5e52211fa0dc3/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10420 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_68df0af504c21aa2b1ce/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10421 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6903f75a616124fbbe62/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10422 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_69748744deacc485a2da/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10423 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6a46f0468637fa1ceea4/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10424 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6b45e20838de2009119b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10425 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6cdfd3f8d054eaf72194/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10426 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e06599623de7d47c750/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10427 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ec1ef9088ffe38a3d25/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10428 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_707d5fc3c98b3c204500/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10429 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_70a99404c72ad381de36/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10430 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_70ae67fe6de015024b24+cd3419b6/model.neff filter=lfs diff=lfs merge=lfs -text
|
10431 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_70ae67fe6de015024b24+cd3419b6/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
10432 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_71d6f99f019cce5d2c56/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10433 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_7291119501971561507+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10434 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_72b1081c4393b26efe11/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10435 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_733d8ce97f615c7406f6/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10436 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_749c49190e3a9c9b1317/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10437 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_74c4ec2a3829c1027457/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10438 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_77e174f71c47d9f4d0b7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10439 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_7b1d8863929b4701df6d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10440 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_7b8399664c54026a03ff/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10441 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_7be6e0568963be54593a/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10442 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_7cc364920677c1ace017/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10443 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_7dd477985731dbce8cf8/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10444 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_7ec9c0b2b3c87c96c7d0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10445 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_80563bbcc3f75213156d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10446 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_80c925bab2fcc5749b91/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10447 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_8285b8316500e52286c9/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10448 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_8319eff5a8285defb5a3/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10449 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_833bce8fd7e57021a525/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10450 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_83466d3415d7c423ad3a/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10451 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_83b76f3670fb9dd6d79d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10452 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_8417307499696621353+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
10453 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_855c66679f1728d4b0b9/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10454 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_876a3fac78c9e7d8d969/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10455 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_87b36020196a848d8295/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10456 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_87eb7ec28b9b01a3f8de/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10457 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_87eb7ec28b9b01a3f8de/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10458 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_87eb7ec28b9b01a3f8de/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10459 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_87eb7ec28b9b01a3f8de/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10460 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_8829976eff976b676195/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10461 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_88abbb6c39ef61b204e1/decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10462 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_88abbb6c39ef61b204e1/encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10463 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_896e2cb6bda1ecefc195/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10464 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_89c332555d9bb1164bb3+431f5505/model.neff filter=lfs diff=lfs merge=lfs -text
|
10465 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_8afa7462593888c1ace0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10466 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_8b1a6646a196796c979b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10467 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_8eea34f80bdd528f4c47/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10468 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9013e8baf47aa2490da7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10469 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_903f2ac3444c8203b948/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10470 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_922088b97905a7fc46ca/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10471 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9280fd71681625e0f026/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10472 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_92b322085492cfc5743f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10473 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_92f51980d46489605055/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10474 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_93fb6328ff6b4914fec7/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10475 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_93fb6328ff6b4914fec7/text_encoder_2/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10476 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_93fb6328ff6b4914fec7/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10477 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_93fb6328ff6b4914fec7/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10478 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_93fb6328ff6b4914fec7/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10479 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_950e3bf7ec0e47e9d1f6/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10480 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9584ca4279d47aa94f96/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10481 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_96263cd071abd0bb8205/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10482 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_96735d336b988c7ae46c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10483 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f2f0fe551f33210e73/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10484 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_98afed8f23bccfa2bf93/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10485 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_99a4d278a736dc55c4e1/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10486 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_99bc626550f56c193835/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10487 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9a0e849430be2af050d7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10488 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9a67f4255c65b566abfd/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10489 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9b1e403c2901fc8169d9/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10490 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9b69ad26e6071c069631/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10491 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9e7952fae90c1f6f8fb4/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10492 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9f5df17622d13f7aa0a1/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10493 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9f6a8efd40fcd1be4ca9/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10494 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1326d88e9b290f8e35a/controlnet_0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10495 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1326d88e9b290f8e35a/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10496 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1326d88e9b290f8e35a/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10497 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1326d88e9b290f8e35a/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10498 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1326d88e9b290f8e35a/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10499 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a456d73c225440c520af/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10500 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a456d73c225440c520af/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10501 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a456d73c225440c520af/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10502 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a456d73c225440c520af/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10503 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a6e434271f70307fe55a/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10504 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a7dcaa4d6f7541916f6b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10505 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_aa7706c37f42f9b0efa0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10506 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ab0ec5a632242310c520/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10507 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ac82cc5cd27456228f9b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10508 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ad9de1959357baf1be93/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10509 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_aeebf3f56cf9d0ed0250/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10510 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_af36677e1d281b7581b7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10511 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b26cf211d0154814b6de/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10512 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b2a5715c8de1d06e02d1/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10513 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b45d43ae8e345b80b8b6/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10514 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b46c903d70fcbd8dde04/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10515 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b571d0d9ac9ad084fa8c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10516 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b5b638607d26526724c7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10517 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b6abe5e7902b7d92c00b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10518 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b825412615cae3305380/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10519 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b83eb9efb666a7597fa6/controlnet_0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10520 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b83eb9efb666a7597fa6/controlnet_1/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10521 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b83eb9efb666a7597fa6/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10522 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b83eb9efb666a7597fa6/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10523 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b83eb9efb666a7597fa6/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10524 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b83eb9efb666a7597fa6/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10525 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ba276d9e084c36d4d299/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10526 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bb5b129941b54904675f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10527 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc33d8c25a64bc49fa25/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10528 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc33d8c25a64bc49fa25/text_encoder_2/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10529 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc33d8c25a64bc49fa25/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10530 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc33d8c25a64bc49fa25/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10531 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc33d8c25a64bc49fa25/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10532 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc7d63ab74772beafa77/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10533 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd8a7636ac96599afce0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10534 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bf898d9815ecfc28a3c4/decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10535 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bf898d9815ecfc28a3c4/encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10536 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_c121d453d2dce97dc9f2/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10537 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_c1a7e229a1e0089bc100/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10538 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_c3dac669c643d4e0b641/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10539 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_c6a6313df00b13f0bc20/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10540 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_c76ea064827fb5ffaf3a/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10541 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_c7711f055c4601678bfc/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10542 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_c845c7c1978a7f0fc5bc+cd3419b6/model.neff filter=lfs diff=lfs merge=lfs -text
|
10543 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_c845c7c1978a7f0fc5bc+cd3419b6/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
10544 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_cd2b22a4d8bd6ff87e79/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10545 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ce96b3b9bef1f6cf0d93/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10546 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_cf3a4b3035690a565ab1/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10547 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_cfb94bae5629e275593f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10548 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_cfbfacea58d61c7302ac/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10549 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0207458a6f6fb104830/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10550 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0dd0aeeae66ba529c6f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10551 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d2c282677041876b494e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10552 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d2da3177c42e88297899/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10553 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d327dc6d21691f2390f2/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10554 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d3a9e3a3693c0097041a/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10555 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d4527b583703e675299f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10556 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d5fb9a76d0fdc62db217/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10557 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d5fb9a76d0fdc62db217/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10558 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d5fb9a76d0fdc62db217/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10559 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d5fb9a76d0fdc62db217/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10560 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d63d38954db56a481479/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10561 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d752631e2f1bc8b5bd5c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10562 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d780aaa6e4cc8ef4073b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10563 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d7d576d06e1491d72e5a/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10564 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d83e395611ddc3a29d9f/decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10565 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d83e395611ddc3a29d9f/encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10566 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7feb9a8e6a89d9b5cc/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10567 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbf38214a01c36374929/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10568 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_dc19e38388ce4a13824f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10569 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_dcfeb3310672a794fe59/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10570 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_dec4d4d1adf057ba26a6/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10571 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e00b8a80c7b4565a38b9/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10572 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e01d4f3ed05b3b779179/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10573 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e050716b5de372871d73/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10574 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e0768f223c51e12fd868/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10575 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e0d110db2ae6fd6f9a18/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10576 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e0e485d1effe77c0355a/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10577 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e207d10cd73986f34774/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10578 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e2594a1f187f452902f7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10579 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e3343136a71050139f62/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10580 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e3343136a71050139f62/text_encoder_2/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10581 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e3343136a71050139f62/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10582 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e3343136a71050139f62/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10583 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e3343136a71050139f62/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10584 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4834fd951418b796374/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10585 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e57cbde649dde732937d/decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10586 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e57cbde649dde732937d/encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10587 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e59dd1535caa6a29b4cc/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10588 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e5c893a9ead6645e9326/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10589 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e7d6a1ed3ce052d450ca/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10590 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e7e71e6beffbf701391b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10591 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ea65e810b73a07c4f93e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10592 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ea81a963f6aa67da9f09/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10593 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_eaa04c5b1a458bb8ede4/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10594 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_eaffcb1bcf2a2ba5568c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10595 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ebdd3f238f484caa6f2b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10596 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ed32d4174c8c48368338/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10597 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ef32dca934503ba9400c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10598 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f0f76b9ba98b72bdf648/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10599 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f15944a91bf873bc4059/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10600 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f1ec63e05f9ea876842c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10601 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f2764d531dd4d92fcf44/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10602 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f2fb67dde0ac51075166/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10603 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f3e9a9a693c44ea917dc/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10604 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f441d043990635e01090/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10605 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f58c375fdf2f49018e38/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10606 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f59412f8a600e9a71fb8/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10607 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f73c821d92438436ad6c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10608 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f8697b18674e9f438a96/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10609 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f8990edfbb4deaf97027/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10610 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f99a0822ae493faf0bb5/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10611 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_fa6da73026ca7a0eb10f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10612 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_fba7e5f3d8634f923189/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10613 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_fd402f1583fe91543618/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10614 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_fe61ce3dd9af75901342/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10615 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ff3a95a3a80afa64563d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
10616 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ffe8abf61d5a2a0a2b8e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev0/qwen2/Qwen/Qwen2.5-0.5B/5eef7da50a217db5b302.json
ADDED
@@ -0,0 +1,97 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "Qwen/Qwen2.5-0.5B",
|
4 |
+
"_task": "text-generation",
|
5 |
+
"architectures": [
|
6 |
+
"Qwen2ForCausalLM"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.0,
|
9 |
+
"hidden_act": "silu",
|
10 |
+
"hidden_size": 896,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"intermediate_size": 4864,
|
13 |
+
"layer_types": [
|
14 |
+
"full_attention",
|
15 |
+
"full_attention",
|
16 |
+
"full_attention",
|
17 |
+
"full_attention",
|
18 |
+
"full_attention",
|
19 |
+
"full_attention",
|
20 |
+
"full_attention",
|
21 |
+
"full_attention",
|
22 |
+
"full_attention",
|
23 |
+
"full_attention",
|
24 |
+
"full_attention",
|
25 |
+
"full_attention",
|
26 |
+
"full_attention",
|
27 |
+
"full_attention",
|
28 |
+
"full_attention",
|
29 |
+
"full_attention",
|
30 |
+
"full_attention",
|
31 |
+
"full_attention",
|
32 |
+
"full_attention",
|
33 |
+
"full_attention",
|
34 |
+
"full_attention",
|
35 |
+
"full_attention",
|
36 |
+
"full_attention",
|
37 |
+
"full_attention"
|
38 |
+
],
|
39 |
+
"max_position_embeddings": 32768,
|
40 |
+
"max_window_layers": 24,
|
41 |
+
"model_type": "qwen2",
|
42 |
+
"neuron": {
|
43 |
+
"_serialized_key": "NxDNeuronConfig",
|
44 |
+
"async_mode": false,
|
45 |
+
"attn_kernel_enabled": false,
|
46 |
+
"batch_size": 1,
|
47 |
+
"capacity_factor": null,
|
48 |
+
"cc_pipeline_tiling_factor": 2,
|
49 |
+
"checkpoint_id": "Qwen/Qwen2.5-0.5B",
|
50 |
+
"checkpoint_revision": "060db6499f32faf8b98477b0a26969ef7d8b9987",
|
51 |
+
"continuous_batching": false,
|
52 |
+
"enable_bucketing": false,
|
53 |
+
"ep_degree": 1,
|
54 |
+
"flash_decoding_enabled": false,
|
55 |
+
"fused_qkv": false,
|
56 |
+
"glu_mlp": true,
|
57 |
+
"is_chunked_prefill": false,
|
58 |
+
"local_ranks_size": 2,
|
59 |
+
"logical_nc_config": 1,
|
60 |
+
"max_batch_size": 1,
|
61 |
+
"max_context_length": 128,
|
62 |
+
"max_topk": 256,
|
63 |
+
"mlp_kernel_enabled": false,
|
64 |
+
"mlp_kernel_fuse_residual_add": false,
|
65 |
+
"n_active_tokens": 128,
|
66 |
+
"neuronxcc_version": "2.19.8089.0+8ab9f450",
|
67 |
+
"num_cores_per_group": 1,
|
68 |
+
"on_device_sampling": true,
|
69 |
+
"optimum_neuron_version": "0.3.1.dev0",
|
70 |
+
"output_logits": false,
|
71 |
+
"padding_side": "right",
|
72 |
+
"pp_degree": 1,
|
73 |
+
"qk_layernorm": false,
|
74 |
+
"qkv_kernel_enabled": false,
|
75 |
+
"rpl_reduce_dtype": "bfloat16",
|
76 |
+
"sequence_length": 128,
|
77 |
+
"sequence_parallel_enabled": false,
|
78 |
+
"speculation_length": 0,
|
79 |
+
"start_rank_id": 0,
|
80 |
+
"target": null,
|
81 |
+
"torch_dtype": "bfloat16",
|
82 |
+
"tp_degree": 2,
|
83 |
+
"vocab_parallel": false
|
84 |
+
},
|
85 |
+
"num_attention_heads": 14,
|
86 |
+
"num_hidden_layers": 24,
|
87 |
+
"num_key_value_heads": 2,
|
88 |
+
"rms_norm_eps": 1e-06,
|
89 |
+
"rope_scaling": null,
|
90 |
+
"rope_theta": 1000000.0,
|
91 |
+
"sliding_window": null,
|
92 |
+
"tie_word_embeddings": true,
|
93 |
+
"use_cache": true,
|
94 |
+
"use_mrope": false,
|
95 |
+
"use_sliding_window": false,
|
96 |
+
"vocab_size": 151936
|
97 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev0/qwen2/yujiepan/qwen2.5-128k-tiny-random/3292185f0123466a93a2.json
ADDED
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "yujiepan/qwen2.5-128k-tiny-random",
|
4 |
+
"_task": "text-generation",
|
5 |
+
"architectures": [
|
6 |
+
"Qwen2ForCausalLM"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.0,
|
9 |
+
"hidden_act": "silu",
|
10 |
+
"hidden_size": 8,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"intermediate_size": 16,
|
13 |
+
"layer_types": [
|
14 |
+
"full_attention",
|
15 |
+
"full_attention"
|
16 |
+
],
|
17 |
+
"max_position_embeddings": 32768,
|
18 |
+
"max_window_layers": 1,
|
19 |
+
"model_type": "qwen2",
|
20 |
+
"neuron": {
|
21 |
+
"_serialized_key": "NxDNeuronConfig",
|
22 |
+
"async_mode": false,
|
23 |
+
"attn_kernel_enabled": false,
|
24 |
+
"batch_size": 2,
|
25 |
+
"capacity_factor": null,
|
26 |
+
"cc_pipeline_tiling_factor": 2,
|
27 |
+
"checkpoint_id": "yujiepan/qwen2.5-128k-tiny-random",
|
28 |
+
"checkpoint_revision": "c8296d4ca3f87782876d2382fbb6481d1beb8ef0",
|
29 |
+
"continuous_batching": true,
|
30 |
+
"enable_bucketing": false,
|
31 |
+
"ep_degree": 1,
|
32 |
+
"flash_decoding_enabled": false,
|
33 |
+
"fused_qkv": false,
|
34 |
+
"glu_mlp": true,
|
35 |
+
"is_chunked_prefill": false,
|
36 |
+
"local_ranks_size": 2,
|
37 |
+
"logical_nc_config": 1,
|
38 |
+
"max_batch_size": 2,
|
39 |
+
"max_context_length": 100,
|
40 |
+
"max_topk": 256,
|
41 |
+
"mlp_kernel_enabled": false,
|
42 |
+
"mlp_kernel_fuse_residual_add": false,
|
43 |
+
"n_active_tokens": 100,
|
44 |
+
"neuronxcc_version": "2.19.8089.0+8ab9f450",
|
45 |
+
"num_cores_per_group": 1,
|
46 |
+
"on_device_sampling": false,
|
47 |
+
"optimum_neuron_version": "0.3.1.dev0",
|
48 |
+
"output_logits": false,
|
49 |
+
"padding_side": "right",
|
50 |
+
"pp_degree": 1,
|
51 |
+
"qk_layernorm": false,
|
52 |
+
"qkv_kernel_enabled": false,
|
53 |
+
"rpl_reduce_dtype": "float16",
|
54 |
+
"sequence_length": 100,
|
55 |
+
"sequence_parallel_enabled": false,
|
56 |
+
"speculation_length": 0,
|
57 |
+
"start_rank_id": 0,
|
58 |
+
"target": null,
|
59 |
+
"torch_dtype": "float16",
|
60 |
+
"tp_degree": 2,
|
61 |
+
"vocab_parallel": false
|
62 |
+
},
|
63 |
+
"num_attention_heads": 4,
|
64 |
+
"num_hidden_layers": 2,
|
65 |
+
"num_key_value_heads": 2,
|
66 |
+
"rms_norm_eps": 1e-06,
|
67 |
+
"rope_scaling": {
|
68 |
+
"factor": 4.0,
|
69 |
+
"original_max_position_embeddings": 32768,
|
70 |
+
"rope_type": "yarn",
|
71 |
+
"type": "yarn"
|
72 |
+
},
|
73 |
+
"rope_theta": 1000000.0,
|
74 |
+
"sliding_window": null,
|
75 |
+
"tie_word_embeddings": false,
|
76 |
+
"use_cache": true,
|
77 |
+
"use_sliding_window": false,
|
78 |
+
"vocab_size": 152064
|
79 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev0/qwen2/yujiepan/qwen2.5-128k-tiny-random/b60dca7d7a9c53810fe0.json
ADDED
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "yujiepan/qwen2.5-128k-tiny-random",
|
4 |
+
"_task": "text-generation",
|
5 |
+
"architectures": [
|
6 |
+
"Qwen2ForCausalLM"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.0,
|
9 |
+
"hidden_act": "silu",
|
10 |
+
"hidden_size": 8,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"intermediate_size": 16,
|
13 |
+
"layer_types": [
|
14 |
+
"full_attention",
|
15 |
+
"full_attention"
|
16 |
+
],
|
17 |
+
"max_position_embeddings": 32768,
|
18 |
+
"max_window_layers": 1,
|
19 |
+
"model_type": "qwen2",
|
20 |
+
"neuron": {
|
21 |
+
"_serialized_key": "NxDNeuronConfig",
|
22 |
+
"async_mode": false,
|
23 |
+
"attn_kernel_enabled": false,
|
24 |
+
"batch_size": 1,
|
25 |
+
"capacity_factor": null,
|
26 |
+
"cc_pipeline_tiling_factor": 2,
|
27 |
+
"checkpoint_id": "yujiepan/qwen2.5-128k-tiny-random",
|
28 |
+
"checkpoint_revision": "c8296d4ca3f87782876d2382fbb6481d1beb8ef0",
|
29 |
+
"continuous_batching": false,
|
30 |
+
"enable_bucketing": false,
|
31 |
+
"ep_degree": 1,
|
32 |
+
"flash_decoding_enabled": false,
|
33 |
+
"fused_qkv": false,
|
34 |
+
"glu_mlp": true,
|
35 |
+
"is_chunked_prefill": false,
|
36 |
+
"local_ranks_size": 2,
|
37 |
+
"logical_nc_config": 1,
|
38 |
+
"max_batch_size": 1,
|
39 |
+
"max_context_length": 100,
|
40 |
+
"max_topk": 256,
|
41 |
+
"mlp_kernel_enabled": false,
|
42 |
+
"mlp_kernel_fuse_residual_add": false,
|
43 |
+
"n_active_tokens": 100,
|
44 |
+
"neuronxcc_version": "2.19.8089.0+8ab9f450",
|
45 |
+
"num_cores_per_group": 1,
|
46 |
+
"on_device_sampling": true,
|
47 |
+
"optimum_neuron_version": "0.3.1.dev0",
|
48 |
+
"output_logits": false,
|
49 |
+
"padding_side": "right",
|
50 |
+
"pp_degree": 1,
|
51 |
+
"qk_layernorm": false,
|
52 |
+
"qkv_kernel_enabled": false,
|
53 |
+
"rpl_reduce_dtype": "float16",
|
54 |
+
"sequence_length": 100,
|
55 |
+
"sequence_parallel_enabled": false,
|
56 |
+
"speculation_length": 0,
|
57 |
+
"start_rank_id": 0,
|
58 |
+
"target": null,
|
59 |
+
"torch_dtype": "float16",
|
60 |
+
"tp_degree": 2,
|
61 |
+
"vocab_parallel": false
|
62 |
+
},
|
63 |
+
"num_attention_heads": 4,
|
64 |
+
"num_hidden_layers": 2,
|
65 |
+
"num_key_value_heads": 2,
|
66 |
+
"rms_norm_eps": 1e-06,
|
67 |
+
"rope_scaling": {
|
68 |
+
"factor": 4.0,
|
69 |
+
"original_max_position_embeddings": 32768,
|
70 |
+
"rope_type": "yarn",
|
71 |
+
"type": "yarn"
|
72 |
+
},
|
73 |
+
"rope_theta": 1000000.0,
|
74 |
+
"sliding_window": null,
|
75 |
+
"tie_word_embeddings": false,
|
76 |
+
"use_cache": true,
|
77 |
+
"use_sliding_window": false,
|
78 |
+
"vocab_size": 152064
|
79 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev0/qwen2/yujiepan/qwen2.5-128k-tiny-random/b9b0c081795fa9e33ca6.json
ADDED
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "yujiepan/qwen2.5-128k-tiny-random",
|
4 |
+
"_task": "text-generation",
|
5 |
+
"architectures": [
|
6 |
+
"Qwen2ForCausalLM"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.0,
|
9 |
+
"hidden_act": "silu",
|
10 |
+
"hidden_size": 8,
|
11 |
+
"initializer_range": 0.02,
|
12 |
+
"intermediate_size": 16,
|
13 |
+
"layer_types": [
|
14 |
+
"full_attention",
|
15 |
+
"full_attention"
|
16 |
+
],
|
17 |
+
"max_position_embeddings": 32768,
|
18 |
+
"max_window_layers": 1,
|
19 |
+
"model_type": "qwen2",
|
20 |
+
"neuron": {
|
21 |
+
"_serialized_key": "NxDNeuronConfig",
|
22 |
+
"async_mode": false,
|
23 |
+
"attn_kernel_enabled": false,
|
24 |
+
"batch_size": 1,
|
25 |
+
"capacity_factor": null,
|
26 |
+
"cc_pipeline_tiling_factor": 2,
|
27 |
+
"checkpoint_id": "yujiepan/qwen2.5-128k-tiny-random",
|
28 |
+
"checkpoint_revision": "c8296d4ca3f87782876d2382fbb6481d1beb8ef0",
|
29 |
+
"continuous_batching": false,
|
30 |
+
"enable_bucketing": false,
|
31 |
+
"ep_degree": 1,
|
32 |
+
"flash_decoding_enabled": false,
|
33 |
+
"fused_qkv": false,
|
34 |
+
"glu_mlp": true,
|
35 |
+
"is_chunked_prefill": false,
|
36 |
+
"local_ranks_size": 2,
|
37 |
+
"logical_nc_config": 1,
|
38 |
+
"max_batch_size": 1,
|
39 |
+
"max_context_length": 100,
|
40 |
+
"max_topk": 256,
|
41 |
+
"mlp_kernel_enabled": false,
|
42 |
+
"mlp_kernel_fuse_residual_add": false,
|
43 |
+
"n_active_tokens": 100,
|
44 |
+
"neuronxcc_version": "2.19.8089.0+8ab9f450",
|
45 |
+
"num_cores_per_group": 1,
|
46 |
+
"on_device_sampling": true,
|
47 |
+
"optimum_neuron_version": "0.3.1.dev0",
|
48 |
+
"output_logits": false,
|
49 |
+
"padding_side": "right",
|
50 |
+
"pp_degree": 1,
|
51 |
+
"qk_layernorm": false,
|
52 |
+
"qkv_kernel_enabled": false,
|
53 |
+
"rpl_reduce_dtype": "bfloat16",
|
54 |
+
"sequence_length": 100,
|
55 |
+
"sequence_parallel_enabled": false,
|
56 |
+
"speculation_length": 0,
|
57 |
+
"start_rank_id": 0,
|
58 |
+
"target": null,
|
59 |
+
"torch_dtype": "bfloat16",
|
60 |
+
"tp_degree": 2,
|
61 |
+
"vocab_parallel": false
|
62 |
+
},
|
63 |
+
"num_attention_heads": 4,
|
64 |
+
"num_hidden_layers": 2,
|
65 |
+
"num_key_value_heads": 2,
|
66 |
+
"rms_norm_eps": 1e-06,
|
67 |
+
"rope_scaling": {
|
68 |
+
"factor": 4.0,
|
69 |
+
"original_max_position_embeddings": 32768,
|
70 |
+
"rope_type": "yarn",
|
71 |
+
"type": "yarn"
|
72 |
+
},
|
73 |
+
"rope_theta": 1000000.0,
|
74 |
+
"sliding_window": null,
|
75 |
+
"tie_word_embeddings": false,
|
76 |
+
"use_cache": true,
|
77 |
+
"use_sliding_window": false,
|
78 |
+
"vocab_size": 152064
|
79 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/082c855afd5bbe38fea8.json
ADDED
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "fill-mask",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": false,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"logits"
|
42 |
+
],
|
43 |
+
"static_batch_size": 1,
|
44 |
+
"static_sequence_length": 128,
|
45 |
+
"task": "fill-mask",
|
46 |
+
"tensor_parallel_size": 1
|
47 |
+
},
|
48 |
+
"num_attention_heads": 6,
|
49 |
+
"num_hidden_groups": 6,
|
50 |
+
"num_hidden_layers": 6,
|
51 |
+
"position_embedding_type": "absolute",
|
52 |
+
"type_vocab_size": 16,
|
53 |
+
"vocab_size": 30000
|
54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/19ebb6a6a5ec909e86f1.json
ADDED
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "feature-extraction",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": true,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"last_hidden_state",
|
42 |
+
"pooler_output"
|
43 |
+
],
|
44 |
+
"static_batch_size": 1,
|
45 |
+
"static_sequence_length": 32,
|
46 |
+
"task": "feature-extraction",
|
47 |
+
"tensor_parallel_size": 1
|
48 |
+
},
|
49 |
+
"num_attention_heads": 6,
|
50 |
+
"num_hidden_groups": 6,
|
51 |
+
"num_hidden_layers": 6,
|
52 |
+
"position_embedding_type": "absolute",
|
53 |
+
"type_vocab_size": 16,
|
54 |
+
"vocab_size": 30000
|
55 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/1e1cab9afee16970464a.json
ADDED
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "question-answering",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": false,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"start_logits",
|
42 |
+
"end_logits"
|
43 |
+
],
|
44 |
+
"static_batch_size": 1,
|
45 |
+
"static_sequence_length": 32,
|
46 |
+
"task": "question-answering",
|
47 |
+
"tensor_parallel_size": 1
|
48 |
+
},
|
49 |
+
"num_attention_heads": 6,
|
50 |
+
"num_hidden_groups": 6,
|
51 |
+
"num_hidden_layers": 6,
|
52 |
+
"position_embedding_type": "absolute",
|
53 |
+
"type_vocab_size": 16,
|
54 |
+
"vocab_size": 30000
|
55 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/2420b2b633bc1e938403.json
ADDED
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "text-classification",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": false,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"logits"
|
42 |
+
],
|
43 |
+
"static_batch_size": 1,
|
44 |
+
"static_sequence_length": 32,
|
45 |
+
"task": "text-classification",
|
46 |
+
"tensor_parallel_size": 1
|
47 |
+
},
|
48 |
+
"num_attention_heads": 6,
|
49 |
+
"num_hidden_groups": 6,
|
50 |
+
"num_hidden_layers": 6,
|
51 |
+
"position_embedding_type": "absolute",
|
52 |
+
"type_vocab_size": 16,
|
53 |
+
"vocab_size": 30000
|
54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/3585a8b7eec15ef74cc9.json
ADDED
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "multiple-choice",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": true,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"logits"
|
42 |
+
],
|
43 |
+
"static_batch_size": 1,
|
44 |
+
"static_num_choices": 4,
|
45 |
+
"static_sequence_length": 128,
|
46 |
+
"task": "multiple-choice",
|
47 |
+
"tensor_parallel_size": 1
|
48 |
+
},
|
49 |
+
"num_attention_heads": 6,
|
50 |
+
"num_hidden_groups": 6,
|
51 |
+
"num_hidden_layers": 6,
|
52 |
+
"position_embedding_type": "absolute",
|
53 |
+
"type_vocab_size": 16,
|
54 |
+
"vocab_size": 30000
|
55 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/4d038e1c09d623b63731.json
ADDED
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "feature-extraction",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": false,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"last_hidden_state",
|
42 |
+
"pooler_output"
|
43 |
+
],
|
44 |
+
"static_batch_size": 1,
|
45 |
+
"static_sequence_length": 128,
|
46 |
+
"task": "feature-extraction",
|
47 |
+
"tensor_parallel_size": 1
|
48 |
+
},
|
49 |
+
"num_attention_heads": 6,
|
50 |
+
"num_hidden_groups": 6,
|
51 |
+
"num_hidden_layers": 6,
|
52 |
+
"position_embedding_type": "absolute",
|
53 |
+
"type_vocab_size": 16,
|
54 |
+
"vocab_size": 30000
|
55 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/59c92a651b8b40190b9d.json
ADDED
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "token-classification",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": false,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"logits"
|
42 |
+
],
|
43 |
+
"static_batch_size": 1,
|
44 |
+
"static_sequence_length": 32,
|
45 |
+
"task": "token-classification",
|
46 |
+
"tensor_parallel_size": 1
|
47 |
+
},
|
48 |
+
"num_attention_heads": 6,
|
49 |
+
"num_hidden_groups": 6,
|
50 |
+
"num_hidden_layers": 6,
|
51 |
+
"position_embedding_type": "absolute",
|
52 |
+
"type_vocab_size": 16,
|
53 |
+
"vocab_size": 30000
|
54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/707d5fc3c98b3c204500.json
ADDED
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "fill-mask",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": true,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"logits"
|
42 |
+
],
|
43 |
+
"static_batch_size": 1,
|
44 |
+
"static_sequence_length": 32,
|
45 |
+
"task": "fill-mask",
|
46 |
+
"tensor_parallel_size": 1
|
47 |
+
},
|
48 |
+
"num_attention_heads": 6,
|
49 |
+
"num_hidden_groups": 6,
|
50 |
+
"num_hidden_layers": 6,
|
51 |
+
"position_embedding_type": "absolute",
|
52 |
+
"type_vocab_size": 16,
|
53 |
+
"vocab_size": 30000
|
54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/8829976eff976b676195.json
ADDED
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "token-classification",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": false,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"logits"
|
42 |
+
],
|
43 |
+
"static_batch_size": 1,
|
44 |
+
"static_sequence_length": 128,
|
45 |
+
"task": "token-classification",
|
46 |
+
"tensor_parallel_size": 1
|
47 |
+
},
|
48 |
+
"num_attention_heads": 6,
|
49 |
+
"num_hidden_groups": 6,
|
50 |
+
"num_hidden_layers": 6,
|
51 |
+
"position_embedding_type": "absolute",
|
52 |
+
"type_vocab_size": 16,
|
53 |
+
"vocab_size": 30000
|
54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/903f2ac3444c8203b948.json
ADDED
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "fill-mask",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": false,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"logits"
|
42 |
+
],
|
43 |
+
"static_batch_size": 1,
|
44 |
+
"static_sequence_length": 32,
|
45 |
+
"task": "fill-mask",
|
46 |
+
"tensor_parallel_size": 1
|
47 |
+
},
|
48 |
+
"num_attention_heads": 6,
|
49 |
+
"num_hidden_groups": 6,
|
50 |
+
"num_hidden_layers": 6,
|
51 |
+
"position_embedding_type": "absolute",
|
52 |
+
"type_vocab_size": 16,
|
53 |
+
"vocab_size": 30000
|
54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/9b69ad26e6071c069631.json
ADDED
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "question-answering",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": false,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"start_logits",
|
42 |
+
"end_logits"
|
43 |
+
],
|
44 |
+
"static_batch_size": 1,
|
45 |
+
"static_sequence_length": 128,
|
46 |
+
"task": "question-answering",
|
47 |
+
"tensor_parallel_size": 1
|
48 |
+
},
|
49 |
+
"num_attention_heads": 6,
|
50 |
+
"num_hidden_groups": 6,
|
51 |
+
"num_hidden_layers": 6,
|
52 |
+
"position_embedding_type": "absolute",
|
53 |
+
"type_vocab_size": 16,
|
54 |
+
"vocab_size": 30000
|
55 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/aa7706c37f42f9b0efa0.json
ADDED
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "token-classification",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": true,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"logits"
|
42 |
+
],
|
43 |
+
"static_batch_size": 1,
|
44 |
+
"static_sequence_length": 32,
|
45 |
+
"task": "token-classification",
|
46 |
+
"tensor_parallel_size": 1
|
47 |
+
},
|
48 |
+
"num_attention_heads": 6,
|
49 |
+
"num_hidden_groups": 6,
|
50 |
+
"num_hidden_layers": 6,
|
51 |
+
"position_embedding_type": "absolute",
|
52 |
+
"type_vocab_size": 16,
|
53 |
+
"vocab_size": 30000
|
54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/b5b638607d26526724c7.json
ADDED
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "text-classification",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": false,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"logits"
|
42 |
+
],
|
43 |
+
"static_batch_size": 1,
|
44 |
+
"static_sequence_length": 128,
|
45 |
+
"task": "text-classification",
|
46 |
+
"tensor_parallel_size": 1
|
47 |
+
},
|
48 |
+
"num_attention_heads": 6,
|
49 |
+
"num_hidden_groups": 6,
|
50 |
+
"num_hidden_layers": 6,
|
51 |
+
"position_embedding_type": "absolute",
|
52 |
+
"type_vocab_size": 16,
|
53 |
+
"vocab_size": 30000
|
54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/ce96b3b9bef1f6cf0d93.json
ADDED
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "question-answering",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": true,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"start_logits",
|
42 |
+
"end_logits"
|
43 |
+
],
|
44 |
+
"static_batch_size": 1,
|
45 |
+
"static_sequence_length": 32,
|
46 |
+
"task": "question-answering",
|
47 |
+
"tensor_parallel_size": 1
|
48 |
+
},
|
49 |
+
"num_attention_heads": 6,
|
50 |
+
"num_hidden_groups": 6,
|
51 |
+
"num_hidden_layers": 6,
|
52 |
+
"position_embedding_type": "absolute",
|
53 |
+
"type_vocab_size": 16,
|
54 |
+
"vocab_size": 30000
|
55 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/cf3a4b3035690a565ab1.json
ADDED
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "feature-extraction",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": false,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"last_hidden_state",
|
42 |
+
"pooler_output"
|
43 |
+
],
|
44 |
+
"static_batch_size": 1,
|
45 |
+
"static_sequence_length": 32,
|
46 |
+
"task": "feature-extraction",
|
47 |
+
"tensor_parallel_size": 1
|
48 |
+
},
|
49 |
+
"num_attention_heads": 6,
|
50 |
+
"num_hidden_groups": 6,
|
51 |
+
"num_hidden_layers": 6,
|
52 |
+
"position_embedding_type": "absolute",
|
53 |
+
"type_vocab_size": 16,
|
54 |
+
"vocab_size": 30000
|
55 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/d2da3177c42e88297899.json
ADDED
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "multiple-choice",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": false,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"logits"
|
42 |
+
],
|
43 |
+
"static_batch_size": 1,
|
44 |
+
"static_num_choices": 4,
|
45 |
+
"static_sequence_length": 128,
|
46 |
+
"task": "multiple-choice",
|
47 |
+
"tensor_parallel_size": 1
|
48 |
+
},
|
49 |
+
"num_attention_heads": 6,
|
50 |
+
"num_hidden_groups": 6,
|
51 |
+
"num_hidden_layers": 6,
|
52 |
+
"position_embedding_type": "absolute",
|
53 |
+
"type_vocab_size": 16,
|
54 |
+
"vocab_size": 30000
|
55 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/e59dd1535caa6a29b4cc.json
ADDED
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
4 |
+
"_task": "text-classification",
|
5 |
+
"architectures": [
|
6 |
+
"AlbertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout_prob": 0.1,
|
10 |
+
"embedding_size": 128,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 36,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"inner_group_num": 1,
|
16 |
+
"intermediate_size": 37,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "albert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": true,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask",
|
33 |
+
"token_type_ids"
|
34 |
+
],
|
35 |
+
"int_dtype": "int64",
|
36 |
+
"model_type": "albert",
|
37 |
+
"optlevel": "2",
|
38 |
+
"output_attentions": false,
|
39 |
+
"output_hidden_states": false,
|
40 |
+
"output_names": [
|
41 |
+
"logits"
|
42 |
+
],
|
43 |
+
"static_batch_size": 1,
|
44 |
+
"static_sequence_length": 32,
|
45 |
+
"task": "text-classification",
|
46 |
+
"tensor_parallel_size": 1
|
47 |
+
},
|
48 |
+
"num_attention_heads": 6,
|
49 |
+
"num_hidden_groups": 6,
|
50 |
+
"num_hidden_layers": 6,
|
51 |
+
"position_embedding_type": "absolute",
|
52 |
+
"type_vocab_size": 16,
|
53 |
+
"vocab_size": 30000
|
54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/beit/hf-internal-testing/tiny-random-BeitForImageClassification/7b8399664c54026a03ff.json
ADDED
@@ -0,0 +1,90 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BeitForImageClassification",
|
4 |
+
"_task": "image-classification",
|
5 |
+
"add_fpn": false,
|
6 |
+
"architectures": [
|
7 |
+
"BeitForImageClassification"
|
8 |
+
],
|
9 |
+
"attention_probs_dropout_prob": 0.1,
|
10 |
+
"auxiliary_channels": 256,
|
11 |
+
"auxiliary_concat_input": false,
|
12 |
+
"auxiliary_loss_weight": 0.4,
|
13 |
+
"auxiliary_num_convs": 1,
|
14 |
+
"drop_path_rate": 0.1,
|
15 |
+
"hidden_act": "gelu",
|
16 |
+
"hidden_dropout_prob": 0.1,
|
17 |
+
"hidden_size": 32,
|
18 |
+
"image_size": 30,
|
19 |
+
"initializer_range": 0.02,
|
20 |
+
"intermediate_size": 37,
|
21 |
+
"layer_norm_eps": 1e-12,
|
22 |
+
"layer_scale_init_value": 0.1,
|
23 |
+
"model_type": "beit",
|
24 |
+
"neuron": {
|
25 |
+
"auto_cast": null,
|
26 |
+
"auto_cast_type": null,
|
27 |
+
"compiler_type": "neuronx-cc",
|
28 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
29 |
+
"disable_fallback": false,
|
30 |
+
"disable_fast_relayout": false,
|
31 |
+
"dynamic_batch_size": true,
|
32 |
+
"float_dtype": "fp32",
|
33 |
+
"inline_weights_to_neff": true,
|
34 |
+
"input_names": [
|
35 |
+
"pixel_values"
|
36 |
+
],
|
37 |
+
"int_dtype": "int64",
|
38 |
+
"model_type": "beit",
|
39 |
+
"optlevel": "2",
|
40 |
+
"output_attentions": false,
|
41 |
+
"output_hidden_states": false,
|
42 |
+
"output_names": [
|
43 |
+
"logits"
|
44 |
+
],
|
45 |
+
"static_batch_size": 1,
|
46 |
+
"static_image_size": 30,
|
47 |
+
"static_num_channels": 3,
|
48 |
+
"static_patch_size": 2,
|
49 |
+
"task": "image-classification",
|
50 |
+
"tensor_parallel_size": 1
|
51 |
+
},
|
52 |
+
"num_attention_heads": 4,
|
53 |
+
"num_channels": 3,
|
54 |
+
"num_hidden_layers": 4,
|
55 |
+
"out_features": [
|
56 |
+
"stem",
|
57 |
+
"stage1",
|
58 |
+
"stage2",
|
59 |
+
"stage3"
|
60 |
+
],
|
61 |
+
"out_indices": [
|
62 |
+
0,
|
63 |
+
1,
|
64 |
+
2,
|
65 |
+
3
|
66 |
+
],
|
67 |
+
"patch_size": 2,
|
68 |
+
"pool_scales": [
|
69 |
+
1,
|
70 |
+
2,
|
71 |
+
3,
|
72 |
+
6
|
73 |
+
],
|
74 |
+
"reshape_hidden_states": true,
|
75 |
+
"semantic_loss_ignore_index": 255,
|
76 |
+
"stage_names": [
|
77 |
+
"stem",
|
78 |
+
"stage1",
|
79 |
+
"stage2",
|
80 |
+
"stage3",
|
81 |
+
"stage4"
|
82 |
+
],
|
83 |
+
"use_absolute_position_embeddings": false,
|
84 |
+
"use_auxiliary_head": true,
|
85 |
+
"use_mask_token": false,
|
86 |
+
"use_mean_pooling": true,
|
87 |
+
"use_relative_position_bias": false,
|
88 |
+
"use_shared_relative_position_bias": false,
|
89 |
+
"vocab_size": 100
|
90 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/beit/hf-internal-testing/tiny-random-BeitForImageClassification/8eea34f80bdd528f4c47.json
ADDED
@@ -0,0 +1,90 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BeitForImageClassification",
|
4 |
+
"_task": "image-classification",
|
5 |
+
"add_fpn": false,
|
6 |
+
"architectures": [
|
7 |
+
"BeitForImageClassification"
|
8 |
+
],
|
9 |
+
"attention_probs_dropout_prob": 0.1,
|
10 |
+
"auxiliary_channels": 256,
|
11 |
+
"auxiliary_concat_input": false,
|
12 |
+
"auxiliary_loss_weight": 0.4,
|
13 |
+
"auxiliary_num_convs": 1,
|
14 |
+
"drop_path_rate": 0.1,
|
15 |
+
"hidden_act": "gelu",
|
16 |
+
"hidden_dropout_prob": 0.1,
|
17 |
+
"hidden_size": 32,
|
18 |
+
"image_size": 30,
|
19 |
+
"initializer_range": 0.02,
|
20 |
+
"intermediate_size": 37,
|
21 |
+
"layer_norm_eps": 1e-12,
|
22 |
+
"layer_scale_init_value": 0.1,
|
23 |
+
"model_type": "beit",
|
24 |
+
"neuron": {
|
25 |
+
"auto_cast": null,
|
26 |
+
"auto_cast_type": null,
|
27 |
+
"compiler_type": "neuronx-cc",
|
28 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
29 |
+
"disable_fallback": false,
|
30 |
+
"disable_fast_relayout": false,
|
31 |
+
"dynamic_batch_size": false,
|
32 |
+
"float_dtype": "fp32",
|
33 |
+
"inline_weights_to_neff": true,
|
34 |
+
"input_names": [
|
35 |
+
"pixel_values"
|
36 |
+
],
|
37 |
+
"int_dtype": "int64",
|
38 |
+
"model_type": "beit",
|
39 |
+
"optlevel": "2",
|
40 |
+
"output_attentions": false,
|
41 |
+
"output_hidden_states": false,
|
42 |
+
"output_names": [
|
43 |
+
"logits"
|
44 |
+
],
|
45 |
+
"static_batch_size": 1,
|
46 |
+
"static_image_size": 30,
|
47 |
+
"static_num_channels": 3,
|
48 |
+
"static_patch_size": 2,
|
49 |
+
"task": "image-classification",
|
50 |
+
"tensor_parallel_size": 1
|
51 |
+
},
|
52 |
+
"num_attention_heads": 4,
|
53 |
+
"num_channels": 3,
|
54 |
+
"num_hidden_layers": 4,
|
55 |
+
"out_features": [
|
56 |
+
"stem",
|
57 |
+
"stage1",
|
58 |
+
"stage2",
|
59 |
+
"stage3"
|
60 |
+
],
|
61 |
+
"out_indices": [
|
62 |
+
0,
|
63 |
+
1,
|
64 |
+
2,
|
65 |
+
3
|
66 |
+
],
|
67 |
+
"patch_size": 2,
|
68 |
+
"pool_scales": [
|
69 |
+
1,
|
70 |
+
2,
|
71 |
+
3,
|
72 |
+
6
|
73 |
+
],
|
74 |
+
"reshape_hidden_states": true,
|
75 |
+
"semantic_loss_ignore_index": 255,
|
76 |
+
"stage_names": [
|
77 |
+
"stem",
|
78 |
+
"stage1",
|
79 |
+
"stage2",
|
80 |
+
"stage3",
|
81 |
+
"stage4"
|
82 |
+
],
|
83 |
+
"use_absolute_position_embeddings": false,
|
84 |
+
"use_auxiliary_head": true,
|
85 |
+
"use_mask_token": false,
|
86 |
+
"use_mean_pooling": true,
|
87 |
+
"use_relative_position_bias": false,
|
88 |
+
"use_shared_relative_position_bias": false,
|
89 |
+
"vocab_size": 100
|
90 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/Jingya/tiny-random-bert-remote-code/601076bf2990d898404b.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "Jingya/tiny-random-bert-remote-code",
|
4 |
+
"_task": "text-classification",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": false,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"logits"
|
40 |
+
],
|
41 |
+
"static_batch_size": 1,
|
42 |
+
"static_sequence_length": 32,
|
43 |
+
"task": "text-classification",
|
44 |
+
"tensor_parallel_size": 1
|
45 |
+
},
|
46 |
+
"num_attention_heads": 4,
|
47 |
+
"num_hidden_layers": 5,
|
48 |
+
"position_embedding_type": "absolute",
|
49 |
+
"type_vocab_size": 16,
|
50 |
+
"use_cache": true,
|
51 |
+
"vocab_size": 1124
|
52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/fxmarty/tiny-bert-sst2-distilled-subfolder/d7d576d06e1491d72e5a.json
ADDED
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "fxmarty/tiny-bert-sst2-distilled-subfolder",
|
4 |
+
"_task": "text-classification",
|
5 |
+
"architectures": [
|
6 |
+
"BertForSequenceClassification"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 128,
|
13 |
+
"id2label": {
|
14 |
+
"0": "negative",
|
15 |
+
"1": "positive"
|
16 |
+
},
|
17 |
+
"initializer_range": 0.02,
|
18 |
+
"intermediate_size": 512,
|
19 |
+
"label2id": {
|
20 |
+
"negative": "0",
|
21 |
+
"positive": "1"
|
22 |
+
},
|
23 |
+
"layer_norm_eps": 1e-12,
|
24 |
+
"max_position_embeddings": 512,
|
25 |
+
"model_type": "bert",
|
26 |
+
"neuron": {
|
27 |
+
"auto_cast": null,
|
28 |
+
"auto_cast_type": null,
|
29 |
+
"compiler_type": "neuronx-cc",
|
30 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
31 |
+
"disable_fallback": false,
|
32 |
+
"disable_fast_relayout": false,
|
33 |
+
"dynamic_batch_size": false,
|
34 |
+
"float_dtype": "fp32",
|
35 |
+
"inline_weights_to_neff": true,
|
36 |
+
"input_names": [
|
37 |
+
"input_ids",
|
38 |
+
"attention_mask",
|
39 |
+
"token_type_ids"
|
40 |
+
],
|
41 |
+
"int_dtype": "int64",
|
42 |
+
"model_type": "bert",
|
43 |
+
"optlevel": "2",
|
44 |
+
"output_attentions": false,
|
45 |
+
"output_hidden_states": false,
|
46 |
+
"output_names": [
|
47 |
+
"logits"
|
48 |
+
],
|
49 |
+
"static_batch_size": 1,
|
50 |
+
"static_sequence_length": 32,
|
51 |
+
"task": "text-classification",
|
52 |
+
"tensor_parallel_size": 1
|
53 |
+
},
|
54 |
+
"num_attention_heads": 2,
|
55 |
+
"num_hidden_layers": 2,
|
56 |
+
"position_embedding_type": "absolute",
|
57 |
+
"problem_type": "single_label_classification",
|
58 |
+
"type_vocab_size": 2,
|
59 |
+
"use_cache": true,
|
60 |
+
"vocab_size": 30522
|
61 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/07d9dac237105afed7b4.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "fill-mask",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": false,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"logits"
|
40 |
+
],
|
41 |
+
"static_batch_size": 1,
|
42 |
+
"static_sequence_length": 32,
|
43 |
+
"task": "fill-mask",
|
44 |
+
"tensor_parallel_size": 1
|
45 |
+
},
|
46 |
+
"num_attention_heads": 4,
|
47 |
+
"num_hidden_layers": 5,
|
48 |
+
"position_embedding_type": "absolute",
|
49 |
+
"type_vocab_size": 16,
|
50 |
+
"use_cache": true,
|
51 |
+
"vocab_size": 1124
|
52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/0d7dca7e1b02d11fa30b.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "text-classification",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": false,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"logits"
|
40 |
+
],
|
41 |
+
"static_batch_size": 1,
|
42 |
+
"static_sequence_length": 32,
|
43 |
+
"task": "text-classification",
|
44 |
+
"tensor_parallel_size": 1
|
45 |
+
},
|
46 |
+
"num_attention_heads": 4,
|
47 |
+
"num_hidden_layers": 5,
|
48 |
+
"position_embedding_type": "absolute",
|
49 |
+
"type_vocab_size": 16,
|
50 |
+
"use_cache": true,
|
51 |
+
"vocab_size": 1124
|
52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/22ce2cce0b08d134021c.json
ADDED
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "multiple-choice",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": false,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"logits"
|
40 |
+
],
|
41 |
+
"static_batch_size": 1,
|
42 |
+
"static_num_choices": 4,
|
43 |
+
"static_sequence_length": 128,
|
44 |
+
"task": "multiple-choice",
|
45 |
+
"tensor_parallel_size": 1
|
46 |
+
},
|
47 |
+
"num_attention_heads": 4,
|
48 |
+
"num_hidden_layers": 5,
|
49 |
+
"position_embedding_type": "absolute",
|
50 |
+
"type_vocab_size": 16,
|
51 |
+
"use_cache": true,
|
52 |
+
"vocab_size": 1124
|
53 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/28bcefedc9caadd676ab.json
ADDED
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "feature-extraction",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": false,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"last_hidden_state",
|
40 |
+
"pooler_output"
|
41 |
+
],
|
42 |
+
"static_batch_size": 1,
|
43 |
+
"static_sequence_length": 128,
|
44 |
+
"task": "feature-extraction",
|
45 |
+
"tensor_parallel_size": 1
|
46 |
+
},
|
47 |
+
"num_attention_heads": 4,
|
48 |
+
"num_hidden_layers": 5,
|
49 |
+
"position_embedding_type": "absolute",
|
50 |
+
"type_vocab_size": 16,
|
51 |
+
"use_cache": true,
|
52 |
+
"vocab_size": 1124
|
53 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/3908bf519c210b434176.json
ADDED
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "feature-extraction",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": false,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"last_hidden_state",
|
40 |
+
"pooler_output"
|
41 |
+
],
|
42 |
+
"static_batch_size": 1,
|
43 |
+
"static_sequence_length": 32,
|
44 |
+
"task": "feature-extraction",
|
45 |
+
"tensor_parallel_size": 1
|
46 |
+
},
|
47 |
+
"num_attention_heads": 4,
|
48 |
+
"num_hidden_layers": 5,
|
49 |
+
"position_embedding_type": "absolute",
|
50 |
+
"type_vocab_size": 16,
|
51 |
+
"use_cache": true,
|
52 |
+
"vocab_size": 1124
|
53 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/5ead9d705b13f37e716b.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "text-classification",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": false,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": false,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"logits"
|
40 |
+
],
|
41 |
+
"static_batch_size": 1,
|
42 |
+
"static_sequence_length": 32,
|
43 |
+
"task": "text-classification",
|
44 |
+
"tensor_parallel_size": 1
|
45 |
+
},
|
46 |
+
"num_attention_heads": 4,
|
47 |
+
"num_hidden_layers": 5,
|
48 |
+
"position_embedding_type": "absolute",
|
49 |
+
"type_vocab_size": 16,
|
50 |
+
"use_cache": true,
|
51 |
+
"vocab_size": 1124
|
52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/80c925bab2fcc5749b91.json
ADDED
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "question-answering",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": false,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"start_logits",
|
40 |
+
"end_logits"
|
41 |
+
],
|
42 |
+
"static_batch_size": 1,
|
43 |
+
"static_sequence_length": 128,
|
44 |
+
"task": "question-answering",
|
45 |
+
"tensor_parallel_size": 1
|
46 |
+
},
|
47 |
+
"num_attention_heads": 4,
|
48 |
+
"num_hidden_layers": 5,
|
49 |
+
"position_embedding_type": "absolute",
|
50 |
+
"type_vocab_size": 16,
|
51 |
+
"use_cache": true,
|
52 |
+
"vocab_size": 1124
|
53 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/92f51980d46489605055.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "text-classification",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": false,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"logits"
|
40 |
+
],
|
41 |
+
"static_batch_size": 1,
|
42 |
+
"static_sequence_length": 128,
|
43 |
+
"task": "text-classification",
|
44 |
+
"tensor_parallel_size": 1
|
45 |
+
},
|
46 |
+
"num_attention_heads": 4,
|
47 |
+
"num_hidden_layers": 5,
|
48 |
+
"position_embedding_type": "absolute",
|
49 |
+
"type_vocab_size": 16,
|
50 |
+
"use_cache": true,
|
51 |
+
"vocab_size": 1124
|
52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/aeebf3f56cf9d0ed0250.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "token-classification",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": false,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"logits"
|
40 |
+
],
|
41 |
+
"static_batch_size": 1,
|
42 |
+
"static_sequence_length": 32,
|
43 |
+
"task": "token-classification",
|
44 |
+
"tensor_parallel_size": 1
|
45 |
+
},
|
46 |
+
"num_attention_heads": 4,
|
47 |
+
"num_hidden_layers": 5,
|
48 |
+
"position_embedding_type": "absolute",
|
49 |
+
"type_vocab_size": 16,
|
50 |
+
"use_cache": true,
|
51 |
+
"vocab_size": 1124
|
52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/cfb94bae5629e275593f.json
ADDED
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "feature-extraction",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": true,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"last_hidden_state",
|
40 |
+
"pooler_output"
|
41 |
+
],
|
42 |
+
"static_batch_size": 1,
|
43 |
+
"static_sequence_length": 32,
|
44 |
+
"task": "feature-extraction",
|
45 |
+
"tensor_parallel_size": 1
|
46 |
+
},
|
47 |
+
"num_attention_heads": 4,
|
48 |
+
"num_hidden_layers": 5,
|
49 |
+
"position_embedding_type": "absolute",
|
50 |
+
"type_vocab_size": 16,
|
51 |
+
"use_cache": true,
|
52 |
+
"vocab_size": 1124
|
53 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e050716b5de372871d73.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "token-classification",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": false,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"logits"
|
40 |
+
],
|
41 |
+
"static_batch_size": 1,
|
42 |
+
"static_sequence_length": 128,
|
43 |
+
"task": "token-classification",
|
44 |
+
"tensor_parallel_size": 1
|
45 |
+
},
|
46 |
+
"num_attention_heads": 4,
|
47 |
+
"num_hidden_layers": 5,
|
48 |
+
"position_embedding_type": "absolute",
|
49 |
+
"type_vocab_size": 16,
|
50 |
+
"use_cache": true,
|
51 |
+
"vocab_size": 1124
|
52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e0768f223c51e12fd868.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "fill-mask",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": true,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"logits"
|
40 |
+
],
|
41 |
+
"static_batch_size": 1,
|
42 |
+
"static_sequence_length": 32,
|
43 |
+
"task": "fill-mask",
|
44 |
+
"tensor_parallel_size": 1
|
45 |
+
},
|
46 |
+
"num_attention_heads": 4,
|
47 |
+
"num_hidden_layers": 5,
|
48 |
+
"position_embedding_type": "absolute",
|
49 |
+
"type_vocab_size": 16,
|
50 |
+
"use_cache": true,
|
51 |
+
"vocab_size": 1124
|
52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e2594a1f187f452902f7.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "fill-mask",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": false,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"logits"
|
40 |
+
],
|
41 |
+
"static_batch_size": 1,
|
42 |
+
"static_sequence_length": 128,
|
43 |
+
"task": "fill-mask",
|
44 |
+
"tensor_parallel_size": 1
|
45 |
+
},
|
46 |
+
"num_attention_heads": 4,
|
47 |
+
"num_hidden_layers": 5,
|
48 |
+
"position_embedding_type": "absolute",
|
49 |
+
"type_vocab_size": 16,
|
50 |
+
"use_cache": true,
|
51 |
+
"vocab_size": 1124
|
52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e4834fd951418b796374.json
ADDED
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "multiple-choice",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": true,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"logits"
|
40 |
+
],
|
41 |
+
"static_batch_size": 1,
|
42 |
+
"static_num_choices": 4,
|
43 |
+
"static_sequence_length": 128,
|
44 |
+
"task": "multiple-choice",
|
45 |
+
"tensor_parallel_size": 1
|
46 |
+
},
|
47 |
+
"num_attention_heads": 4,
|
48 |
+
"num_hidden_layers": 5,
|
49 |
+
"position_embedding_type": "absolute",
|
50 |
+
"type_vocab_size": 16,
|
51 |
+
"use_cache": true,
|
52 |
+
"vocab_size": 1124
|
53 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e7e71e6beffbf701391b.json
ADDED
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "question-answering",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": false,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"start_logits",
|
40 |
+
"end_logits"
|
41 |
+
],
|
42 |
+
"static_batch_size": 1,
|
43 |
+
"static_sequence_length": 32,
|
44 |
+
"task": "question-answering",
|
45 |
+
"tensor_parallel_size": 1
|
46 |
+
},
|
47 |
+
"num_attention_heads": 4,
|
48 |
+
"num_hidden_layers": 5,
|
49 |
+
"position_embedding_type": "absolute",
|
50 |
+
"type_vocab_size": 16,
|
51 |
+
"use_cache": true,
|
52 |
+
"vocab_size": 1124
|
53 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/ea81a963f6aa67da9f09.json
ADDED
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "question-answering",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": true,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"start_logits",
|
40 |
+
"end_logits"
|
41 |
+
],
|
42 |
+
"static_batch_size": 1,
|
43 |
+
"static_sequence_length": 32,
|
44 |
+
"task": "question-answering",
|
45 |
+
"tensor_parallel_size": 1
|
46 |
+
},
|
47 |
+
"num_attention_heads": 4,
|
48 |
+
"num_hidden_layers": 5,
|
49 |
+
"position_embedding_type": "absolute",
|
50 |
+
"type_vocab_size": 16,
|
51 |
+
"use_cache": true,
|
52 |
+
"vocab_size": 1124
|
53 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/ef32dca934503ba9400c.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "token-classification",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": true,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"logits"
|
40 |
+
],
|
41 |
+
"static_batch_size": 1,
|
42 |
+
"static_sequence_length": 32,
|
43 |
+
"task": "token-classification",
|
44 |
+
"tensor_parallel_size": 1
|
45 |
+
},
|
46 |
+
"num_attention_heads": 4,
|
47 |
+
"num_hidden_layers": 5,
|
48 |
+
"position_embedding_type": "absolute",
|
49 |
+
"type_vocab_size": 16,
|
50 |
+
"use_cache": true,
|
51 |
+
"vocab_size": 1124
|
52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/f15944a91bf873bc4059.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
4 |
+
"_task": "text-classification",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"hidden_act": "gelu",
|
11 |
+
"hidden_dropout_prob": 0.1,
|
12 |
+
"hidden_size": 32,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 37,
|
15 |
+
"layer_norm_eps": 1e-12,
|
16 |
+
"max_position_embeddings": 512,
|
17 |
+
"model_type": "bert",
|
18 |
+
"neuron": {
|
19 |
+
"auto_cast": null,
|
20 |
+
"auto_cast_type": null,
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
23 |
+
"disable_fallback": false,
|
24 |
+
"disable_fast_relayout": false,
|
25 |
+
"dynamic_batch_size": true,
|
26 |
+
"float_dtype": "fp32",
|
27 |
+
"inline_weights_to_neff": true,
|
28 |
+
"input_names": [
|
29 |
+
"input_ids",
|
30 |
+
"attention_mask",
|
31 |
+
"token_type_ids"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "bert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"logits"
|
40 |
+
],
|
41 |
+
"static_batch_size": 1,
|
42 |
+
"static_sequence_length": 32,
|
43 |
+
"task": "text-classification",
|
44 |
+
"tensor_parallel_size": 1
|
45 |
+
},
|
46 |
+
"num_attention_heads": 4,
|
47 |
+
"num_hidden_layers": 5,
|
48 |
+
"position_embedding_type": "absolute",
|
49 |
+
"type_vocab_size": 16,
|
50 |
+
"use_cache": true,
|
51 |
+
"vocab_size": 1124
|
52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/sentence-transformers/all-MiniLM-L6-v2/b571d0d9ac9ad084fa8c.json
ADDED
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "sentence-transformers/all-MiniLM-L6-v2",
|
4 |
+
"_task": "feature-extraction",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"export_model_type": "transformer",
|
11 |
+
"gradient_checkpointing": false,
|
12 |
+
"hidden_act": "gelu",
|
13 |
+
"hidden_dropout_prob": 0.1,
|
14 |
+
"hidden_size": 384,
|
15 |
+
"initializer_range": 0.02,
|
16 |
+
"intermediate_size": 1536,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "bert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": false,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask"
|
33 |
+
],
|
34 |
+
"int_dtype": "int64",
|
35 |
+
"model_type": "transformer",
|
36 |
+
"optlevel": "2",
|
37 |
+
"output_attentions": false,
|
38 |
+
"output_hidden_states": false,
|
39 |
+
"output_names": [
|
40 |
+
"token_embeddings",
|
41 |
+
"sentence_embedding"
|
42 |
+
],
|
43 |
+
"static_batch_size": 1,
|
44 |
+
"static_sequence_length": 16,
|
45 |
+
"task": "feature-extraction",
|
46 |
+
"tensor_parallel_size": 1
|
47 |
+
},
|
48 |
+
"num_attention_heads": 12,
|
49 |
+
"num_hidden_layers": 6,
|
50 |
+
"position_embedding_type": "absolute",
|
51 |
+
"type_vocab_size": 2,
|
52 |
+
"use_cache": true,
|
53 |
+
"vocab_size": 30522
|
54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/sentence-transformers/all-MiniLM-L6-v2/f99a0822ae493faf0bb5.json
ADDED
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "sentence-transformers/all-MiniLM-L6-v2",
|
4 |
+
"_task": "feature-extraction",
|
5 |
+
"architectures": [
|
6 |
+
"BertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"export_model_type": "transformer",
|
11 |
+
"gradient_checkpointing": false,
|
12 |
+
"hidden_act": "gelu",
|
13 |
+
"hidden_dropout_prob": 0.1,
|
14 |
+
"hidden_size": 384,
|
15 |
+
"initializer_range": 0.02,
|
16 |
+
"intermediate_size": 1536,
|
17 |
+
"layer_norm_eps": 1e-12,
|
18 |
+
"max_position_embeddings": 512,
|
19 |
+
"model_type": "bert",
|
20 |
+
"neuron": {
|
21 |
+
"auto_cast": null,
|
22 |
+
"auto_cast_type": null,
|
23 |
+
"compiler_type": "neuronx-cc",
|
24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
25 |
+
"disable_fallback": false,
|
26 |
+
"disable_fast_relayout": false,
|
27 |
+
"dynamic_batch_size": true,
|
28 |
+
"float_dtype": "fp32",
|
29 |
+
"inline_weights_to_neff": true,
|
30 |
+
"input_names": [
|
31 |
+
"input_ids",
|
32 |
+
"attention_mask"
|
33 |
+
],
|
34 |
+
"int_dtype": "int64",
|
35 |
+
"model_type": "transformer",
|
36 |
+
"optlevel": "2",
|
37 |
+
"output_attentions": false,
|
38 |
+
"output_hidden_states": false,
|
39 |
+
"output_names": [
|
40 |
+
"token_embeddings",
|
41 |
+
"sentence_embedding"
|
42 |
+
],
|
43 |
+
"static_batch_size": 1,
|
44 |
+
"static_sequence_length": 32,
|
45 |
+
"task": "feature-extraction",
|
46 |
+
"tensor_parallel_size": 1
|
47 |
+
},
|
48 |
+
"num_attention_heads": 12,
|
49 |
+
"num_hidden_layers": 6,
|
50 |
+
"position_embedding_type": "absolute",
|
51 |
+
"type_vocab_size": 2,
|
52 |
+
"use_cache": true,
|
53 |
+
"vocab_size": 30522
|
54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/camembert/hf-internal-testing/tiny-random-camembert/16650c04744503a0af47.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-camembert",
|
4 |
+
"_task": "token-classification",
|
5 |
+
"architectures": [
|
6 |
+
"CamembertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"gradient_checkpointing": false,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 32,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"intermediate_size": 37,
|
16 |
+
"layer_norm_eps": 1e-12,
|
17 |
+
"max_position_embeddings": 512,
|
18 |
+
"model_type": "camembert",
|
19 |
+
"neuron": {
|
20 |
+
"auto_cast": null,
|
21 |
+
"auto_cast_type": null,
|
22 |
+
"compiler_type": "neuronx-cc",
|
23 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
24 |
+
"disable_fallback": false,
|
25 |
+
"disable_fast_relayout": false,
|
26 |
+
"dynamic_batch_size": false,
|
27 |
+
"float_dtype": "fp32",
|
28 |
+
"inline_weights_to_neff": true,
|
29 |
+
"input_names": [
|
30 |
+
"input_ids",
|
31 |
+
"attention_mask"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "camembert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"logits"
|
40 |
+
],
|
41 |
+
"static_batch_size": 1,
|
42 |
+
"static_sequence_length": 32,
|
43 |
+
"task": "token-classification",
|
44 |
+
"tensor_parallel_size": 1
|
45 |
+
},
|
46 |
+
"num_attention_heads": 4,
|
47 |
+
"num_hidden_layers": 5,
|
48 |
+
"position_embedding_type": "absolute",
|
49 |
+
"type_vocab_size": 16,
|
50 |
+
"use_cache": true,
|
51 |
+
"vocab_size": 1000
|
52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/camembert/hf-internal-testing/tiny-random-camembert/3d5fe21de242b8b602d5.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-camembert",
|
4 |
+
"_task": "fill-mask",
|
5 |
+
"architectures": [
|
6 |
+
"CamembertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"gradient_checkpointing": false,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 32,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"intermediate_size": 37,
|
16 |
+
"layer_norm_eps": 1e-12,
|
17 |
+
"max_position_embeddings": 512,
|
18 |
+
"model_type": "camembert",
|
19 |
+
"neuron": {
|
20 |
+
"auto_cast": null,
|
21 |
+
"auto_cast_type": null,
|
22 |
+
"compiler_type": "neuronx-cc",
|
23 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
24 |
+
"disable_fallback": false,
|
25 |
+
"disable_fast_relayout": false,
|
26 |
+
"dynamic_batch_size": true,
|
27 |
+
"float_dtype": "fp32",
|
28 |
+
"inline_weights_to_neff": true,
|
29 |
+
"input_names": [
|
30 |
+
"input_ids",
|
31 |
+
"attention_mask"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "camembert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"logits"
|
40 |
+
],
|
41 |
+
"static_batch_size": 1,
|
42 |
+
"static_sequence_length": 32,
|
43 |
+
"task": "fill-mask",
|
44 |
+
"tensor_parallel_size": 1
|
45 |
+
},
|
46 |
+
"num_attention_heads": 4,
|
47 |
+
"num_hidden_layers": 5,
|
48 |
+
"position_embedding_type": "absolute",
|
49 |
+
"type_vocab_size": 16,
|
50 |
+
"use_cache": true,
|
51 |
+
"vocab_size": 1000
|
52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/camembert/hf-internal-testing/tiny-random-camembert/4b4a4fbbe9d668bcf61e.json
ADDED
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-camembert",
|
4 |
+
"_task": "token-classification",
|
5 |
+
"architectures": [
|
6 |
+
"CamembertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"gradient_checkpointing": false,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 32,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"intermediate_size": 37,
|
16 |
+
"layer_norm_eps": 1e-12,
|
17 |
+
"max_position_embeddings": 512,
|
18 |
+
"model_type": "camembert",
|
19 |
+
"neuron": {
|
20 |
+
"auto_cast": null,
|
21 |
+
"auto_cast_type": null,
|
22 |
+
"compiler_type": "neuronx-cc",
|
23 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
24 |
+
"disable_fallback": false,
|
25 |
+
"disable_fast_relayout": false,
|
26 |
+
"dynamic_batch_size": true,
|
27 |
+
"float_dtype": "fp32",
|
28 |
+
"inline_weights_to_neff": true,
|
29 |
+
"input_names": [
|
30 |
+
"input_ids",
|
31 |
+
"attention_mask"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "camembert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"logits"
|
40 |
+
],
|
41 |
+
"static_batch_size": 1,
|
42 |
+
"static_sequence_length": 32,
|
43 |
+
"task": "token-classification",
|
44 |
+
"tensor_parallel_size": 1
|
45 |
+
},
|
46 |
+
"num_attention_heads": 4,
|
47 |
+
"num_hidden_layers": 5,
|
48 |
+
"position_embedding_type": "absolute",
|
49 |
+
"type_vocab_size": 16,
|
50 |
+
"use_cache": true,
|
51 |
+
"vocab_size": 1000
|
52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/camembert/hf-internal-testing/tiny-random-camembert/5bca725791b646775427.json
ADDED
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_entry_class": "SingleModelCacheEntry",
|
3 |
+
"_model_id": "hf-internal-testing/tiny-random-camembert",
|
4 |
+
"_task": "question-answering",
|
5 |
+
"architectures": [
|
6 |
+
"CamembertModel"
|
7 |
+
],
|
8 |
+
"attention_probs_dropout_prob": 0.1,
|
9 |
+
"classifier_dropout": null,
|
10 |
+
"gradient_checkpointing": false,
|
11 |
+
"hidden_act": "gelu",
|
12 |
+
"hidden_dropout_prob": 0.1,
|
13 |
+
"hidden_size": 32,
|
14 |
+
"initializer_range": 0.02,
|
15 |
+
"intermediate_size": 37,
|
16 |
+
"layer_norm_eps": 1e-12,
|
17 |
+
"max_position_embeddings": 512,
|
18 |
+
"model_type": "camembert",
|
19 |
+
"neuron": {
|
20 |
+
"auto_cast": null,
|
21 |
+
"auto_cast_type": null,
|
22 |
+
"compiler_type": "neuronx-cc",
|
23 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
24 |
+
"disable_fallback": false,
|
25 |
+
"disable_fast_relayout": false,
|
26 |
+
"dynamic_batch_size": false,
|
27 |
+
"float_dtype": "fp32",
|
28 |
+
"inline_weights_to_neff": true,
|
29 |
+
"input_names": [
|
30 |
+
"input_ids",
|
31 |
+
"attention_mask"
|
32 |
+
],
|
33 |
+
"int_dtype": "int64",
|
34 |
+
"model_type": "camembert",
|
35 |
+
"optlevel": "2",
|
36 |
+
"output_attentions": false,
|
37 |
+
"output_hidden_states": false,
|
38 |
+
"output_names": [
|
39 |
+
"start_logits",
|
40 |
+
"end_logits"
|
41 |
+
],
|
42 |
+
"static_batch_size": 1,
|
43 |
+
"static_sequence_length": 128,
|
44 |
+
"task": "question-answering",
|
45 |
+
"tensor_parallel_size": 1
|
46 |
+
},
|
47 |
+
"num_attention_heads": 4,
|
48 |
+
"num_hidden_layers": 5,
|
49 |
+
"position_embedding_type": "absolute",
|
50 |
+
"type_vocab_size": 16,
|
51 |
+
"use_cache": true,
|
52 |
+
"vocab_size": 1000
|
53 |
+
}
|