Synchronizing local compiler cache.
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +344 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev0/qwen2/Qwen/Qwen2.5-0.5B/5eef7da50a217db5b302.json +97 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev0/qwen2/yujiepan/qwen2.5-128k-tiny-random/3292185f0123466a93a2.json +79 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev0/qwen2/yujiepan/qwen2.5-128k-tiny-random/b60dca7d7a9c53810fe0.json +79 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev0/qwen2/yujiepan/qwen2.5-128k-tiny-random/b9b0c081795fa9e33ca6.json +79 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/082c855afd5bbe38fea8.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/19ebb6a6a5ec909e86f1.json +55 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/1e1cab9afee16970464a.json +55 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/2420b2b633bc1e938403.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/3585a8b7eec15ef74cc9.json +55 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/4d038e1c09d623b63731.json +55 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/59c92a651b8b40190b9d.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/707d5fc3c98b3c204500.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/8829976eff976b676195.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/903f2ac3444c8203b948.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/9b69ad26e6071c069631.json +55 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/aa7706c37f42f9b0efa0.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/b5b638607d26526724c7.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/ce96b3b9bef1f6cf0d93.json +55 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/cf3a4b3035690a565ab1.json +55 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/d2da3177c42e88297899.json +55 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/e59dd1535caa6a29b4cc.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/beit/hf-internal-testing/tiny-random-BeitForImageClassification/7b8399664c54026a03ff.json +90 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/beit/hf-internal-testing/tiny-random-BeitForImageClassification/8eea34f80bdd528f4c47.json +90 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/Jingya/tiny-random-bert-remote-code/601076bf2990d898404b.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/fxmarty/tiny-bert-sst2-distilled-subfolder/d7d576d06e1491d72e5a.json +61 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/07d9dac237105afed7b4.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/0d7dca7e1b02d11fa30b.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/22ce2cce0b08d134021c.json +53 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/28bcefedc9caadd676ab.json +53 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/3908bf519c210b434176.json +53 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/5ead9d705b13f37e716b.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/80c925bab2fcc5749b91.json +53 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/92f51980d46489605055.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/aeebf3f56cf9d0ed0250.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/cfb94bae5629e275593f.json +53 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e050716b5de372871d73.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e0768f223c51e12fd868.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e2594a1f187f452902f7.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e4834fd951418b796374.json +53 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e7e71e6beffbf701391b.json +53 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/ea81a963f6aa67da9f09.json +53 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/ef32dca934503ba9400c.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/f15944a91bf873bc4059.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/sentence-transformers/all-MiniLM-L6-v2/b571d0d9ac9ad084fa8c.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/sentence-transformers/all-MiniLM-L6-v2/f99a0822ae493faf0bb5.json +54 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/camembert/hf-internal-testing/tiny-random-camembert/16650c04744503a0af47.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/camembert/hf-internal-testing/tiny-random-camembert/3d5fe21de242b8b602d5.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/camembert/hf-internal-testing/tiny-random-camembert/4b4a4fbbe9d668bcf61e.json +52 -0
- neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/camembert/hf-internal-testing/tiny-random-camembert/5bca725791b646775427.json +53 -0
.gitattributes
CHANGED
|
@@ -10270,3 +10270,347 @@ neuronxcc-2.20.9961.0+0acef03a/MODULE_057bc784fc164fb34d3e+ed72d204/model.neff f
|
|
| 10270 |
neuronxcc-2.20.9961.0+0acef03a/MODULE_de733c6f96020a1e5f56+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10271 |
neuronxcc-2.20.9961.0+0acef03a/MODULE_de733c6f96020a1e5f56+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
| 10272 |
neuronxcc-2.20.9961.0+0acef03a/MODULE_e3031c3c114f7c905db7+ae6a382b/model.neff filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10270 |
neuronxcc-2.20.9961.0+0acef03a/MODULE_de733c6f96020a1e5f56+a9d440f5/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10271 |
neuronxcc-2.20.9961.0+0acef03a/MODULE_de733c6f96020a1e5f56+a9d440f5/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
| 10272 |
neuronxcc-2.20.9961.0+0acef03a/MODULE_e3031c3c114f7c905db7+ae6a382b/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10273 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0219e831452f3e9b80e6/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10274 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_021be40fb5716d1066d1/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10275 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_02c51eae95f4097f74e7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10276 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_07d9dac237105afed7b4/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10277 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_082c855afd5bbe38fea8/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10278 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0994f3d43a554bcbbcd7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10279 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0ad6e67d0b4363af0472/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10280 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0af77bd813eb760ae10d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10281 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0b0b6686a4841c281f89/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10282 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0b384d0739d57659345e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10283 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0bfe6d17355fd2f0836f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10284 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0ca055684d61c552e3ec/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10285 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0ca23862a0ff1499156f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10286 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0d7dca7e1b02d11fa30b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10287 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0e02d4795b77fba80c35/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10288 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0f556b899de48f28b455/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10289 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_0fdfb4247e7d07ebbad0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10290 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_101f045ec3ef38dff069/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10291 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_11228616321528259762+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10292 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1179fb416e242252b8b1/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10293 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_117dcaf2b5ba5b392c51/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10294 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_11d26d78110e3ea447dd/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10295 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_12273156641748218648+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10296 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1227467f6a1477aec333/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10297 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1355027528627e06e5cb/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10298 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_136344c1e04a80fc9e83/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10299 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_14069605881026998085+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10300 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_14160024224657763603+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10301 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_14829227305888857035+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10302 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_148a07ab282c4e1a2a0e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10303 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_15025462673285903344+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10304 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_15f7e443873c3474a6aa/decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10305 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_15f7e443873c3474a6aa/encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10306 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_16650c04744503a0af47/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10307 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_16839706381867715922+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10308 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_16b01b31bf5bb1c85c1d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10309 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_17327912813737302838+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10310 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_17419856824540332941+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10311 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_17641195202625304294+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10312 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_17711110885328520544+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10313 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_17855694184933887987+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10314 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_184d9b81ae20431d278e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10315 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_18d8cc6bf53b525ebb83/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10316 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_19a9557944c3c798892c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10317 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_19ebb6a6a5ec909e86f1/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10318 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ae5dec75b26da7fc293+253d6470/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10319 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1be47d7ec35995ba24e2/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10320 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1ccdb35db19ea6d46330/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10321 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1d4e0541af5c102c02ad/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10322 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1e1cab9afee16970464a/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10323 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1f71844521461b69a9a1/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10324 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1f71844521461b69a9a1/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10325 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1f71844521461b69a9a1/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10326 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1f71844521461b69a9a1/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10327 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_1f997b4c07c5b98b2872/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10328 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2011979c1c7685c0c1e8/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10329 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_22ac4beaed8c828e276d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10330 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_22ce2cce0b08d134021c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10331 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2420b2b633bc1e938403/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10332 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2518ad68ffda816de14c+a74130ed/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10333 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2518ad68ffda816de14c+a74130ed/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
| 10334 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_27494e54568e0f4aef97/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10335 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_28bcefedc9caadd676ab/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10336 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2994655886375ea65794/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10337 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2bfc916223b281bde6c9/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10338 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2c3447cbfc1aa2c980e4/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10339 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2d941194111edd1cc349/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10340 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2ec978f7548ba514cc92/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10341 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_2eeccd3fb290738b486c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10342 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_30709c9a1366cc22f381/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10343 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3091516cc256301854d5/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10344 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3164ef3b6e4540774d38/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10345 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3262637bc52e95809853+431f5505/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10346 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_33c68608ff1365e11b4b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10347 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_35240b83eadb946e8397/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10348 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3585a8b7eec15ef74cc9/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10349 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3666724308aaa469662b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10350 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_37fb28b99dfea65dc5fd/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10351 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_38fe3c7c7cf144065eac/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10352 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3908bf519c210b434176/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10353 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_39152d050ca1aafdbcb7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10354 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3bf2eb59f27536b63a45/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10355 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3d5fe21de242b8b602d5/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10356 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_3f7a39fcaca1f42af1d6/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10357 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4067177570182b1343d2/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10358 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4148dd3c4e0957c59aec/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10359 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4375062474730619889+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10360 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_44670f0e856e93e13945/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10361 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_45c7246705c9e6fab659/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10362 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_466672b98b30e850228e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10363 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_467e3986218b1c421e16/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10364 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4696932584f9d8f704d5/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10365 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4750006367237009755+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10366 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_484d55fa9705364e6d6c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10367 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_491a208ef81533ee4361/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10368 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4974b909ef52ed6985aa/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10369 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4b4a4fbbe9d668bcf61e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10370 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4b5db21c35dab98379c0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10371 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4bf35dcb438eff118841/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10372 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4d038e1c09d623b63731/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10373 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4d2fe63b7ea76c7ef876+a74130ed/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10374 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4d2fe63b7ea76c7ef876+a74130ed/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
| 10375 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_4e4ef27b3302beb416e2+253d6470/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10376 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_50466361a10e0beb2743/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10377 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_50881c62b5e180d29b73/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10378 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_50dd1eff58edae4890c4/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10379 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_52ac96dddc861615c14b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10380 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_530b46c2c544923d9ae4/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10381 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5321652960071550735+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10382 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_54999f3651eabb911710/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10383 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_565ec63172e78bb6a459/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10384 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_566b362576597dc93bf0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10385 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_56fb08782842e65d4478/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10386 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_56fb7ca25c9741358f35/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10387 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_57575a85181cb2c0c6ce/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10388 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_59287e3a63d75be1484e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10389 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_59c92a651b8b40190b9d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10390 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5bca725791b646775427/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10391 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5cfaeab2b13c776d07bb/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10392 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5d5dadc2c2138bf8ab44/decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10393 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5d5dadc2c2138bf8ab44/encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10394 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5dba74ecad23c5836b41/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10395 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5de28d74475c2e525475/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10396 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5e0f1f4e96fb7f38115d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10397 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5ead9d705b13f37e716b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10398 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5ee5e7496586a5b158cd/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10399 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5fb0198cf9dd4a2e93ea/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10400 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_5fc297836c63bcff7ed3/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10401 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_601076bf2990d898404b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10402 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_602b46624db97cda3fee/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10403 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6081e29d0b26014e391f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10404 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_61774b9874fadd5b1723/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10405 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_61a96b508e7be967c0c7+cd3419b6/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10406 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_61a96b508e7be967c0c7+cd3419b6/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
| 10407 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_62c0826140d6564782c3/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10408 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6356dda8884e943ca1eb/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10409 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6356dda8884e943ca1eb/text_encoder_2/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10410 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6356dda8884e943ca1eb/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10411 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6356dda8884e943ca1eb/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10412 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6356dda8884e943ca1eb/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10413 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_639b34a908c080e3d3e9/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10414 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_63b1a6be8b23f66fef00/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10415 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_64383c5d9ccd5d74a246/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10416 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_64a180bec331b8ec91ba/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10417 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_655beeec84479afaaafe/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10418 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_66be3aba74892f370b62/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10419 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_68d42db5e52211fa0dc3/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10420 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_68df0af504c21aa2b1ce/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10421 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6903f75a616124fbbe62/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10422 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_69748744deacc485a2da/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10423 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6a46f0468637fa1ceea4/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10424 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6b45e20838de2009119b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10425 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6cdfd3f8d054eaf72194/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10426 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6e06599623de7d47c750/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10427 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_6ec1ef9088ffe38a3d25/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10428 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_707d5fc3c98b3c204500/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10429 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_70a99404c72ad381de36/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10430 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_70ae67fe6de015024b24+cd3419b6/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10431 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_70ae67fe6de015024b24+cd3419b6/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
| 10432 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_71d6f99f019cce5d2c56/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10433 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_7291119501971561507+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10434 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_72b1081c4393b26efe11/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10435 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_733d8ce97f615c7406f6/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10436 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_749c49190e3a9c9b1317/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10437 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_74c4ec2a3829c1027457/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10438 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_77e174f71c47d9f4d0b7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10439 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_7b1d8863929b4701df6d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10440 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_7b8399664c54026a03ff/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10441 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_7be6e0568963be54593a/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10442 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_7cc364920677c1ace017/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10443 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_7dd477985731dbce8cf8/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10444 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_7ec9c0b2b3c87c96c7d0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10445 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_80563bbcc3f75213156d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10446 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_80c925bab2fcc5749b91/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10447 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_8285b8316500e52286c9/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10448 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_8319eff5a8285defb5a3/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10449 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_833bce8fd7e57021a525/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10450 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_83466d3415d7c423ad3a/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10451 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_83b76f3670fb9dd6d79d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10452 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_8417307499696621353+e30acd3a/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10453 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_855c66679f1728d4b0b9/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10454 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_876a3fac78c9e7d8d969/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10455 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_87b36020196a848d8295/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10456 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_87eb7ec28b9b01a3f8de/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10457 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_87eb7ec28b9b01a3f8de/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10458 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_87eb7ec28b9b01a3f8de/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10459 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_87eb7ec28b9b01a3f8de/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10460 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_8829976eff976b676195/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10461 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_88abbb6c39ef61b204e1/decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10462 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_88abbb6c39ef61b204e1/encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10463 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_896e2cb6bda1ecefc195/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10464 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_89c332555d9bb1164bb3+431f5505/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10465 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_8afa7462593888c1ace0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10466 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_8b1a6646a196796c979b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10467 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_8eea34f80bdd528f4c47/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10468 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9013e8baf47aa2490da7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10469 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_903f2ac3444c8203b948/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10470 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_922088b97905a7fc46ca/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10471 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9280fd71681625e0f026/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10472 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_92b322085492cfc5743f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10473 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_92f51980d46489605055/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10474 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_93fb6328ff6b4914fec7/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10475 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_93fb6328ff6b4914fec7/text_encoder_2/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10476 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_93fb6328ff6b4914fec7/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10477 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_93fb6328ff6b4914fec7/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10478 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_93fb6328ff6b4914fec7/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10479 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_950e3bf7ec0e47e9d1f6/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10480 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9584ca4279d47aa94f96/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10481 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_96263cd071abd0bb8205/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10482 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_96735d336b988c7ae46c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10483 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_96f2f0fe551f33210e73/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10484 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_98afed8f23bccfa2bf93/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10485 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_99a4d278a736dc55c4e1/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10486 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_99bc626550f56c193835/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10487 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9a0e849430be2af050d7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10488 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9a67f4255c65b566abfd/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10489 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9b1e403c2901fc8169d9/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10490 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9b69ad26e6071c069631/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10491 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9e7952fae90c1f6f8fb4/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10492 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9f5df17622d13f7aa0a1/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10493 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_9f6a8efd40fcd1be4ca9/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10494 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1326d88e9b290f8e35a/controlnet_0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10495 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1326d88e9b290f8e35a/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10496 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1326d88e9b290f8e35a/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10497 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1326d88e9b290f8e35a/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10498 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a1326d88e9b290f8e35a/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10499 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a456d73c225440c520af/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10500 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a456d73c225440c520af/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10501 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a456d73c225440c520af/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10502 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a456d73c225440c520af/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10503 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a6e434271f70307fe55a/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10504 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_a7dcaa4d6f7541916f6b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10505 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_aa7706c37f42f9b0efa0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10506 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ab0ec5a632242310c520/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10507 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ac82cc5cd27456228f9b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10508 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ad9de1959357baf1be93/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10509 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_aeebf3f56cf9d0ed0250/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10510 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_af36677e1d281b7581b7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10511 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b26cf211d0154814b6de/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10512 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b2a5715c8de1d06e02d1/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10513 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b45d43ae8e345b80b8b6/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10514 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b46c903d70fcbd8dde04/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10515 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b571d0d9ac9ad084fa8c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10516 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b5b638607d26526724c7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10517 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b6abe5e7902b7d92c00b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10518 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b825412615cae3305380/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10519 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b83eb9efb666a7597fa6/controlnet_0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10520 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b83eb9efb666a7597fa6/controlnet_1/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10521 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b83eb9efb666a7597fa6/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10522 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b83eb9efb666a7597fa6/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10523 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b83eb9efb666a7597fa6/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10524 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_b83eb9efb666a7597fa6/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10525 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ba276d9e084c36d4d299/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10526 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bb5b129941b54904675f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10527 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc33d8c25a64bc49fa25/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10528 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc33d8c25a64bc49fa25/text_encoder_2/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10529 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc33d8c25a64bc49fa25/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10530 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc33d8c25a64bc49fa25/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10531 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc33d8c25a64bc49fa25/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10532 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bc7d63ab74772beafa77/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10533 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bd8a7636ac96599afce0/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10534 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bf898d9815ecfc28a3c4/decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10535 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_bf898d9815ecfc28a3c4/encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10536 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_c121d453d2dce97dc9f2/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10537 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_c1a7e229a1e0089bc100/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10538 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_c3dac669c643d4e0b641/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10539 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_c6a6313df00b13f0bc20/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10540 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_c76ea064827fb5ffaf3a/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10541 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_c7711f055c4601678bfc/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10542 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_c845c7c1978a7f0fc5bc+cd3419b6/model.neff filter=lfs diff=lfs merge=lfs -text
|
| 10543 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_c845c7c1978a7f0fc5bc+cd3419b6/wrapped_neff.hlo filter=lfs diff=lfs merge=lfs -text
|
| 10544 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_cd2b22a4d8bd6ff87e79/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10545 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ce96b3b9bef1f6cf0d93/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10546 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_cf3a4b3035690a565ab1/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10547 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_cfb94bae5629e275593f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10548 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_cfbfacea58d61c7302ac/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10549 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0207458a6f6fb104830/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10550 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d0dd0aeeae66ba529c6f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10551 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d2c282677041876b494e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10552 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d2da3177c42e88297899/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10553 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d327dc6d21691f2390f2/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10554 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d3a9e3a3693c0097041a/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10555 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d4527b583703e675299f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10556 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d5fb9a76d0fdc62db217/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10557 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d5fb9a76d0fdc62db217/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10558 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d5fb9a76d0fdc62db217/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10559 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d5fb9a76d0fdc62db217/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10560 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d63d38954db56a481479/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10561 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d752631e2f1bc8b5bd5c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10562 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d780aaa6e4cc8ef4073b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10563 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d7d576d06e1491d72e5a/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10564 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d83e395611ddc3a29d9f/decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10565 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_d83e395611ddc3a29d9f/encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10566 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_db7feb9a8e6a89d9b5cc/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10567 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_dbf38214a01c36374929/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10568 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_dc19e38388ce4a13824f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10569 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_dcfeb3310672a794fe59/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10570 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_dec4d4d1adf057ba26a6/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10571 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e00b8a80c7b4565a38b9/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10572 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e01d4f3ed05b3b779179/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10573 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e050716b5de372871d73/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10574 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e0768f223c51e12fd868/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10575 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e0d110db2ae6fd6f9a18/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10576 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e0e485d1effe77c0355a/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10577 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e207d10cd73986f34774/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10578 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e2594a1f187f452902f7/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10579 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e3343136a71050139f62/text_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10580 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e3343136a71050139f62/text_encoder_2/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10581 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e3343136a71050139f62/unet/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10582 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e3343136a71050139f62/vae_decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10583 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e3343136a71050139f62/vae_encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10584 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e4834fd951418b796374/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10585 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e57cbde649dde732937d/decoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10586 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e57cbde649dde732937d/encoder/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10587 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e59dd1535caa6a29b4cc/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10588 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e5c893a9ead6645e9326/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10589 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e7d6a1ed3ce052d450ca/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10590 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_e7e71e6beffbf701391b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10591 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ea65e810b73a07c4f93e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10592 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ea81a963f6aa67da9f09/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10593 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_eaa04c5b1a458bb8ede4/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10594 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_eaffcb1bcf2a2ba5568c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10595 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ebdd3f238f484caa6f2b/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10596 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ed32d4174c8c48368338/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10597 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ef32dca934503ba9400c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10598 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f0f76b9ba98b72bdf648/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10599 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f15944a91bf873bc4059/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10600 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f1ec63e05f9ea876842c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10601 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f2764d531dd4d92fcf44/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10602 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f2fb67dde0ac51075166/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10603 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f3e9a9a693c44ea917dc/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10604 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f441d043990635e01090/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10605 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f58c375fdf2f49018e38/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10606 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f59412f8a600e9a71fb8/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10607 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f73c821d92438436ad6c/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10608 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f8697b18674e9f438a96/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10609 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f8990edfbb4deaf97027/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10610 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_f99a0822ae493faf0bb5/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10611 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_fa6da73026ca7a0eb10f/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10612 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_fba7e5f3d8634f923189/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10613 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_fd402f1583fe91543618/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10614 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_fe61ce3dd9af75901342/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10615 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ff3a95a3a80afa64563d/model.neuron filter=lfs diff=lfs merge=lfs -text
|
| 10616 |
+
neuronxcc-2.19.8089.0+8ab9f450/MODULE_ffe8abf61d5a2a0a2b8e/model.neuron filter=lfs diff=lfs merge=lfs -text
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev0/qwen2/Qwen/Qwen2.5-0.5B/5eef7da50a217db5b302.json
ADDED
|
@@ -0,0 +1,97 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "Qwen/Qwen2.5-0.5B",
|
| 4 |
+
"_task": "text-generation",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"Qwen2ForCausalLM"
|
| 7 |
+
],
|
| 8 |
+
"attention_dropout": 0.0,
|
| 9 |
+
"hidden_act": "silu",
|
| 10 |
+
"hidden_size": 896,
|
| 11 |
+
"initializer_range": 0.02,
|
| 12 |
+
"intermediate_size": 4864,
|
| 13 |
+
"layer_types": [
|
| 14 |
+
"full_attention",
|
| 15 |
+
"full_attention",
|
| 16 |
+
"full_attention",
|
| 17 |
+
"full_attention",
|
| 18 |
+
"full_attention",
|
| 19 |
+
"full_attention",
|
| 20 |
+
"full_attention",
|
| 21 |
+
"full_attention",
|
| 22 |
+
"full_attention",
|
| 23 |
+
"full_attention",
|
| 24 |
+
"full_attention",
|
| 25 |
+
"full_attention",
|
| 26 |
+
"full_attention",
|
| 27 |
+
"full_attention",
|
| 28 |
+
"full_attention",
|
| 29 |
+
"full_attention",
|
| 30 |
+
"full_attention",
|
| 31 |
+
"full_attention",
|
| 32 |
+
"full_attention",
|
| 33 |
+
"full_attention",
|
| 34 |
+
"full_attention",
|
| 35 |
+
"full_attention",
|
| 36 |
+
"full_attention",
|
| 37 |
+
"full_attention"
|
| 38 |
+
],
|
| 39 |
+
"max_position_embeddings": 32768,
|
| 40 |
+
"max_window_layers": 24,
|
| 41 |
+
"model_type": "qwen2",
|
| 42 |
+
"neuron": {
|
| 43 |
+
"_serialized_key": "NxDNeuronConfig",
|
| 44 |
+
"async_mode": false,
|
| 45 |
+
"attn_kernel_enabled": false,
|
| 46 |
+
"batch_size": 1,
|
| 47 |
+
"capacity_factor": null,
|
| 48 |
+
"cc_pipeline_tiling_factor": 2,
|
| 49 |
+
"checkpoint_id": "Qwen/Qwen2.5-0.5B",
|
| 50 |
+
"checkpoint_revision": "060db6499f32faf8b98477b0a26969ef7d8b9987",
|
| 51 |
+
"continuous_batching": false,
|
| 52 |
+
"enable_bucketing": false,
|
| 53 |
+
"ep_degree": 1,
|
| 54 |
+
"flash_decoding_enabled": false,
|
| 55 |
+
"fused_qkv": false,
|
| 56 |
+
"glu_mlp": true,
|
| 57 |
+
"is_chunked_prefill": false,
|
| 58 |
+
"local_ranks_size": 2,
|
| 59 |
+
"logical_nc_config": 1,
|
| 60 |
+
"max_batch_size": 1,
|
| 61 |
+
"max_context_length": 128,
|
| 62 |
+
"max_topk": 256,
|
| 63 |
+
"mlp_kernel_enabled": false,
|
| 64 |
+
"mlp_kernel_fuse_residual_add": false,
|
| 65 |
+
"n_active_tokens": 128,
|
| 66 |
+
"neuronxcc_version": "2.19.8089.0+8ab9f450",
|
| 67 |
+
"num_cores_per_group": 1,
|
| 68 |
+
"on_device_sampling": true,
|
| 69 |
+
"optimum_neuron_version": "0.3.1.dev0",
|
| 70 |
+
"output_logits": false,
|
| 71 |
+
"padding_side": "right",
|
| 72 |
+
"pp_degree": 1,
|
| 73 |
+
"qk_layernorm": false,
|
| 74 |
+
"qkv_kernel_enabled": false,
|
| 75 |
+
"rpl_reduce_dtype": "bfloat16",
|
| 76 |
+
"sequence_length": 128,
|
| 77 |
+
"sequence_parallel_enabled": false,
|
| 78 |
+
"speculation_length": 0,
|
| 79 |
+
"start_rank_id": 0,
|
| 80 |
+
"target": null,
|
| 81 |
+
"torch_dtype": "bfloat16",
|
| 82 |
+
"tp_degree": 2,
|
| 83 |
+
"vocab_parallel": false
|
| 84 |
+
},
|
| 85 |
+
"num_attention_heads": 14,
|
| 86 |
+
"num_hidden_layers": 24,
|
| 87 |
+
"num_key_value_heads": 2,
|
| 88 |
+
"rms_norm_eps": 1e-06,
|
| 89 |
+
"rope_scaling": null,
|
| 90 |
+
"rope_theta": 1000000.0,
|
| 91 |
+
"sliding_window": null,
|
| 92 |
+
"tie_word_embeddings": true,
|
| 93 |
+
"use_cache": true,
|
| 94 |
+
"use_mrope": false,
|
| 95 |
+
"use_sliding_window": false,
|
| 96 |
+
"vocab_size": 151936
|
| 97 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev0/qwen2/yujiepan/qwen2.5-128k-tiny-random/3292185f0123466a93a2.json
ADDED
|
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "yujiepan/qwen2.5-128k-tiny-random",
|
| 4 |
+
"_task": "text-generation",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"Qwen2ForCausalLM"
|
| 7 |
+
],
|
| 8 |
+
"attention_dropout": 0.0,
|
| 9 |
+
"hidden_act": "silu",
|
| 10 |
+
"hidden_size": 8,
|
| 11 |
+
"initializer_range": 0.02,
|
| 12 |
+
"intermediate_size": 16,
|
| 13 |
+
"layer_types": [
|
| 14 |
+
"full_attention",
|
| 15 |
+
"full_attention"
|
| 16 |
+
],
|
| 17 |
+
"max_position_embeddings": 32768,
|
| 18 |
+
"max_window_layers": 1,
|
| 19 |
+
"model_type": "qwen2",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"_serialized_key": "NxDNeuronConfig",
|
| 22 |
+
"async_mode": false,
|
| 23 |
+
"attn_kernel_enabled": false,
|
| 24 |
+
"batch_size": 2,
|
| 25 |
+
"capacity_factor": null,
|
| 26 |
+
"cc_pipeline_tiling_factor": 2,
|
| 27 |
+
"checkpoint_id": "yujiepan/qwen2.5-128k-tiny-random",
|
| 28 |
+
"checkpoint_revision": "c8296d4ca3f87782876d2382fbb6481d1beb8ef0",
|
| 29 |
+
"continuous_batching": true,
|
| 30 |
+
"enable_bucketing": false,
|
| 31 |
+
"ep_degree": 1,
|
| 32 |
+
"flash_decoding_enabled": false,
|
| 33 |
+
"fused_qkv": false,
|
| 34 |
+
"glu_mlp": true,
|
| 35 |
+
"is_chunked_prefill": false,
|
| 36 |
+
"local_ranks_size": 2,
|
| 37 |
+
"logical_nc_config": 1,
|
| 38 |
+
"max_batch_size": 2,
|
| 39 |
+
"max_context_length": 100,
|
| 40 |
+
"max_topk": 256,
|
| 41 |
+
"mlp_kernel_enabled": false,
|
| 42 |
+
"mlp_kernel_fuse_residual_add": false,
|
| 43 |
+
"n_active_tokens": 100,
|
| 44 |
+
"neuronxcc_version": "2.19.8089.0+8ab9f450",
|
| 45 |
+
"num_cores_per_group": 1,
|
| 46 |
+
"on_device_sampling": false,
|
| 47 |
+
"optimum_neuron_version": "0.3.1.dev0",
|
| 48 |
+
"output_logits": false,
|
| 49 |
+
"padding_side": "right",
|
| 50 |
+
"pp_degree": 1,
|
| 51 |
+
"qk_layernorm": false,
|
| 52 |
+
"qkv_kernel_enabled": false,
|
| 53 |
+
"rpl_reduce_dtype": "float16",
|
| 54 |
+
"sequence_length": 100,
|
| 55 |
+
"sequence_parallel_enabled": false,
|
| 56 |
+
"speculation_length": 0,
|
| 57 |
+
"start_rank_id": 0,
|
| 58 |
+
"target": null,
|
| 59 |
+
"torch_dtype": "float16",
|
| 60 |
+
"tp_degree": 2,
|
| 61 |
+
"vocab_parallel": false
|
| 62 |
+
},
|
| 63 |
+
"num_attention_heads": 4,
|
| 64 |
+
"num_hidden_layers": 2,
|
| 65 |
+
"num_key_value_heads": 2,
|
| 66 |
+
"rms_norm_eps": 1e-06,
|
| 67 |
+
"rope_scaling": {
|
| 68 |
+
"factor": 4.0,
|
| 69 |
+
"original_max_position_embeddings": 32768,
|
| 70 |
+
"rope_type": "yarn",
|
| 71 |
+
"type": "yarn"
|
| 72 |
+
},
|
| 73 |
+
"rope_theta": 1000000.0,
|
| 74 |
+
"sliding_window": null,
|
| 75 |
+
"tie_word_embeddings": false,
|
| 76 |
+
"use_cache": true,
|
| 77 |
+
"use_sliding_window": false,
|
| 78 |
+
"vocab_size": 152064
|
| 79 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev0/qwen2/yujiepan/qwen2.5-128k-tiny-random/b60dca7d7a9c53810fe0.json
ADDED
|
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "yujiepan/qwen2.5-128k-tiny-random",
|
| 4 |
+
"_task": "text-generation",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"Qwen2ForCausalLM"
|
| 7 |
+
],
|
| 8 |
+
"attention_dropout": 0.0,
|
| 9 |
+
"hidden_act": "silu",
|
| 10 |
+
"hidden_size": 8,
|
| 11 |
+
"initializer_range": 0.02,
|
| 12 |
+
"intermediate_size": 16,
|
| 13 |
+
"layer_types": [
|
| 14 |
+
"full_attention",
|
| 15 |
+
"full_attention"
|
| 16 |
+
],
|
| 17 |
+
"max_position_embeddings": 32768,
|
| 18 |
+
"max_window_layers": 1,
|
| 19 |
+
"model_type": "qwen2",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"_serialized_key": "NxDNeuronConfig",
|
| 22 |
+
"async_mode": false,
|
| 23 |
+
"attn_kernel_enabled": false,
|
| 24 |
+
"batch_size": 1,
|
| 25 |
+
"capacity_factor": null,
|
| 26 |
+
"cc_pipeline_tiling_factor": 2,
|
| 27 |
+
"checkpoint_id": "yujiepan/qwen2.5-128k-tiny-random",
|
| 28 |
+
"checkpoint_revision": "c8296d4ca3f87782876d2382fbb6481d1beb8ef0",
|
| 29 |
+
"continuous_batching": false,
|
| 30 |
+
"enable_bucketing": false,
|
| 31 |
+
"ep_degree": 1,
|
| 32 |
+
"flash_decoding_enabled": false,
|
| 33 |
+
"fused_qkv": false,
|
| 34 |
+
"glu_mlp": true,
|
| 35 |
+
"is_chunked_prefill": false,
|
| 36 |
+
"local_ranks_size": 2,
|
| 37 |
+
"logical_nc_config": 1,
|
| 38 |
+
"max_batch_size": 1,
|
| 39 |
+
"max_context_length": 100,
|
| 40 |
+
"max_topk": 256,
|
| 41 |
+
"mlp_kernel_enabled": false,
|
| 42 |
+
"mlp_kernel_fuse_residual_add": false,
|
| 43 |
+
"n_active_tokens": 100,
|
| 44 |
+
"neuronxcc_version": "2.19.8089.0+8ab9f450",
|
| 45 |
+
"num_cores_per_group": 1,
|
| 46 |
+
"on_device_sampling": true,
|
| 47 |
+
"optimum_neuron_version": "0.3.1.dev0",
|
| 48 |
+
"output_logits": false,
|
| 49 |
+
"padding_side": "right",
|
| 50 |
+
"pp_degree": 1,
|
| 51 |
+
"qk_layernorm": false,
|
| 52 |
+
"qkv_kernel_enabled": false,
|
| 53 |
+
"rpl_reduce_dtype": "float16",
|
| 54 |
+
"sequence_length": 100,
|
| 55 |
+
"sequence_parallel_enabled": false,
|
| 56 |
+
"speculation_length": 0,
|
| 57 |
+
"start_rank_id": 0,
|
| 58 |
+
"target": null,
|
| 59 |
+
"torch_dtype": "float16",
|
| 60 |
+
"tp_degree": 2,
|
| 61 |
+
"vocab_parallel": false
|
| 62 |
+
},
|
| 63 |
+
"num_attention_heads": 4,
|
| 64 |
+
"num_hidden_layers": 2,
|
| 65 |
+
"num_key_value_heads": 2,
|
| 66 |
+
"rms_norm_eps": 1e-06,
|
| 67 |
+
"rope_scaling": {
|
| 68 |
+
"factor": 4.0,
|
| 69 |
+
"original_max_position_embeddings": 32768,
|
| 70 |
+
"rope_type": "yarn",
|
| 71 |
+
"type": "yarn"
|
| 72 |
+
},
|
| 73 |
+
"rope_theta": 1000000.0,
|
| 74 |
+
"sliding_window": null,
|
| 75 |
+
"tie_word_embeddings": false,
|
| 76 |
+
"use_cache": true,
|
| 77 |
+
"use_sliding_window": false,
|
| 78 |
+
"vocab_size": 152064
|
| 79 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev0/qwen2/yujiepan/qwen2.5-128k-tiny-random/b9b0c081795fa9e33ca6.json
ADDED
|
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "yujiepan/qwen2.5-128k-tiny-random",
|
| 4 |
+
"_task": "text-generation",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"Qwen2ForCausalLM"
|
| 7 |
+
],
|
| 8 |
+
"attention_dropout": 0.0,
|
| 9 |
+
"hidden_act": "silu",
|
| 10 |
+
"hidden_size": 8,
|
| 11 |
+
"initializer_range": 0.02,
|
| 12 |
+
"intermediate_size": 16,
|
| 13 |
+
"layer_types": [
|
| 14 |
+
"full_attention",
|
| 15 |
+
"full_attention"
|
| 16 |
+
],
|
| 17 |
+
"max_position_embeddings": 32768,
|
| 18 |
+
"max_window_layers": 1,
|
| 19 |
+
"model_type": "qwen2",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"_serialized_key": "NxDNeuronConfig",
|
| 22 |
+
"async_mode": false,
|
| 23 |
+
"attn_kernel_enabled": false,
|
| 24 |
+
"batch_size": 1,
|
| 25 |
+
"capacity_factor": null,
|
| 26 |
+
"cc_pipeline_tiling_factor": 2,
|
| 27 |
+
"checkpoint_id": "yujiepan/qwen2.5-128k-tiny-random",
|
| 28 |
+
"checkpoint_revision": "c8296d4ca3f87782876d2382fbb6481d1beb8ef0",
|
| 29 |
+
"continuous_batching": false,
|
| 30 |
+
"enable_bucketing": false,
|
| 31 |
+
"ep_degree": 1,
|
| 32 |
+
"flash_decoding_enabled": false,
|
| 33 |
+
"fused_qkv": false,
|
| 34 |
+
"glu_mlp": true,
|
| 35 |
+
"is_chunked_prefill": false,
|
| 36 |
+
"local_ranks_size": 2,
|
| 37 |
+
"logical_nc_config": 1,
|
| 38 |
+
"max_batch_size": 1,
|
| 39 |
+
"max_context_length": 100,
|
| 40 |
+
"max_topk": 256,
|
| 41 |
+
"mlp_kernel_enabled": false,
|
| 42 |
+
"mlp_kernel_fuse_residual_add": false,
|
| 43 |
+
"n_active_tokens": 100,
|
| 44 |
+
"neuronxcc_version": "2.19.8089.0+8ab9f450",
|
| 45 |
+
"num_cores_per_group": 1,
|
| 46 |
+
"on_device_sampling": true,
|
| 47 |
+
"optimum_neuron_version": "0.3.1.dev0",
|
| 48 |
+
"output_logits": false,
|
| 49 |
+
"padding_side": "right",
|
| 50 |
+
"pp_degree": 1,
|
| 51 |
+
"qk_layernorm": false,
|
| 52 |
+
"qkv_kernel_enabled": false,
|
| 53 |
+
"rpl_reduce_dtype": "bfloat16",
|
| 54 |
+
"sequence_length": 100,
|
| 55 |
+
"sequence_parallel_enabled": false,
|
| 56 |
+
"speculation_length": 0,
|
| 57 |
+
"start_rank_id": 0,
|
| 58 |
+
"target": null,
|
| 59 |
+
"torch_dtype": "bfloat16",
|
| 60 |
+
"tp_degree": 2,
|
| 61 |
+
"vocab_parallel": false
|
| 62 |
+
},
|
| 63 |
+
"num_attention_heads": 4,
|
| 64 |
+
"num_hidden_layers": 2,
|
| 65 |
+
"num_key_value_heads": 2,
|
| 66 |
+
"rms_norm_eps": 1e-06,
|
| 67 |
+
"rope_scaling": {
|
| 68 |
+
"factor": 4.0,
|
| 69 |
+
"original_max_position_embeddings": 32768,
|
| 70 |
+
"rope_type": "yarn",
|
| 71 |
+
"type": "yarn"
|
| 72 |
+
},
|
| 73 |
+
"rope_theta": 1000000.0,
|
| 74 |
+
"sliding_window": null,
|
| 75 |
+
"tie_word_embeddings": false,
|
| 76 |
+
"use_cache": true,
|
| 77 |
+
"use_sliding_window": false,
|
| 78 |
+
"vocab_size": 152064
|
| 79 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/082c855afd5bbe38fea8.json
ADDED
|
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "fill-mask",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": false,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"logits"
|
| 42 |
+
],
|
| 43 |
+
"static_batch_size": 1,
|
| 44 |
+
"static_sequence_length": 128,
|
| 45 |
+
"task": "fill-mask",
|
| 46 |
+
"tensor_parallel_size": 1
|
| 47 |
+
},
|
| 48 |
+
"num_attention_heads": 6,
|
| 49 |
+
"num_hidden_groups": 6,
|
| 50 |
+
"num_hidden_layers": 6,
|
| 51 |
+
"position_embedding_type": "absolute",
|
| 52 |
+
"type_vocab_size": 16,
|
| 53 |
+
"vocab_size": 30000
|
| 54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/19ebb6a6a5ec909e86f1.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "feature-extraction",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": true,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"last_hidden_state",
|
| 42 |
+
"pooler_output"
|
| 43 |
+
],
|
| 44 |
+
"static_batch_size": 1,
|
| 45 |
+
"static_sequence_length": 32,
|
| 46 |
+
"task": "feature-extraction",
|
| 47 |
+
"tensor_parallel_size": 1
|
| 48 |
+
},
|
| 49 |
+
"num_attention_heads": 6,
|
| 50 |
+
"num_hidden_groups": 6,
|
| 51 |
+
"num_hidden_layers": 6,
|
| 52 |
+
"position_embedding_type": "absolute",
|
| 53 |
+
"type_vocab_size": 16,
|
| 54 |
+
"vocab_size": 30000
|
| 55 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/1e1cab9afee16970464a.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "question-answering",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": false,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"start_logits",
|
| 42 |
+
"end_logits"
|
| 43 |
+
],
|
| 44 |
+
"static_batch_size": 1,
|
| 45 |
+
"static_sequence_length": 32,
|
| 46 |
+
"task": "question-answering",
|
| 47 |
+
"tensor_parallel_size": 1
|
| 48 |
+
},
|
| 49 |
+
"num_attention_heads": 6,
|
| 50 |
+
"num_hidden_groups": 6,
|
| 51 |
+
"num_hidden_layers": 6,
|
| 52 |
+
"position_embedding_type": "absolute",
|
| 53 |
+
"type_vocab_size": 16,
|
| 54 |
+
"vocab_size": 30000
|
| 55 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/2420b2b633bc1e938403.json
ADDED
|
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "text-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": false,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"logits"
|
| 42 |
+
],
|
| 43 |
+
"static_batch_size": 1,
|
| 44 |
+
"static_sequence_length": 32,
|
| 45 |
+
"task": "text-classification",
|
| 46 |
+
"tensor_parallel_size": 1
|
| 47 |
+
},
|
| 48 |
+
"num_attention_heads": 6,
|
| 49 |
+
"num_hidden_groups": 6,
|
| 50 |
+
"num_hidden_layers": 6,
|
| 51 |
+
"position_embedding_type": "absolute",
|
| 52 |
+
"type_vocab_size": 16,
|
| 53 |
+
"vocab_size": 30000
|
| 54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/3585a8b7eec15ef74cc9.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "multiple-choice",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": true,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"logits"
|
| 42 |
+
],
|
| 43 |
+
"static_batch_size": 1,
|
| 44 |
+
"static_num_choices": 4,
|
| 45 |
+
"static_sequence_length": 128,
|
| 46 |
+
"task": "multiple-choice",
|
| 47 |
+
"tensor_parallel_size": 1
|
| 48 |
+
},
|
| 49 |
+
"num_attention_heads": 6,
|
| 50 |
+
"num_hidden_groups": 6,
|
| 51 |
+
"num_hidden_layers": 6,
|
| 52 |
+
"position_embedding_type": "absolute",
|
| 53 |
+
"type_vocab_size": 16,
|
| 54 |
+
"vocab_size": 30000
|
| 55 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/4d038e1c09d623b63731.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "feature-extraction",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": false,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"last_hidden_state",
|
| 42 |
+
"pooler_output"
|
| 43 |
+
],
|
| 44 |
+
"static_batch_size": 1,
|
| 45 |
+
"static_sequence_length": 128,
|
| 46 |
+
"task": "feature-extraction",
|
| 47 |
+
"tensor_parallel_size": 1
|
| 48 |
+
},
|
| 49 |
+
"num_attention_heads": 6,
|
| 50 |
+
"num_hidden_groups": 6,
|
| 51 |
+
"num_hidden_layers": 6,
|
| 52 |
+
"position_embedding_type": "absolute",
|
| 53 |
+
"type_vocab_size": 16,
|
| 54 |
+
"vocab_size": 30000
|
| 55 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/59c92a651b8b40190b9d.json
ADDED
|
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "token-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": false,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"logits"
|
| 42 |
+
],
|
| 43 |
+
"static_batch_size": 1,
|
| 44 |
+
"static_sequence_length": 32,
|
| 45 |
+
"task": "token-classification",
|
| 46 |
+
"tensor_parallel_size": 1
|
| 47 |
+
},
|
| 48 |
+
"num_attention_heads": 6,
|
| 49 |
+
"num_hidden_groups": 6,
|
| 50 |
+
"num_hidden_layers": 6,
|
| 51 |
+
"position_embedding_type": "absolute",
|
| 52 |
+
"type_vocab_size": 16,
|
| 53 |
+
"vocab_size": 30000
|
| 54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/707d5fc3c98b3c204500.json
ADDED
|
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "fill-mask",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": true,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"logits"
|
| 42 |
+
],
|
| 43 |
+
"static_batch_size": 1,
|
| 44 |
+
"static_sequence_length": 32,
|
| 45 |
+
"task": "fill-mask",
|
| 46 |
+
"tensor_parallel_size": 1
|
| 47 |
+
},
|
| 48 |
+
"num_attention_heads": 6,
|
| 49 |
+
"num_hidden_groups": 6,
|
| 50 |
+
"num_hidden_layers": 6,
|
| 51 |
+
"position_embedding_type": "absolute",
|
| 52 |
+
"type_vocab_size": 16,
|
| 53 |
+
"vocab_size": 30000
|
| 54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/8829976eff976b676195.json
ADDED
|
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "token-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": false,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"logits"
|
| 42 |
+
],
|
| 43 |
+
"static_batch_size": 1,
|
| 44 |
+
"static_sequence_length": 128,
|
| 45 |
+
"task": "token-classification",
|
| 46 |
+
"tensor_parallel_size": 1
|
| 47 |
+
},
|
| 48 |
+
"num_attention_heads": 6,
|
| 49 |
+
"num_hidden_groups": 6,
|
| 50 |
+
"num_hidden_layers": 6,
|
| 51 |
+
"position_embedding_type": "absolute",
|
| 52 |
+
"type_vocab_size": 16,
|
| 53 |
+
"vocab_size": 30000
|
| 54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/903f2ac3444c8203b948.json
ADDED
|
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "fill-mask",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": false,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"logits"
|
| 42 |
+
],
|
| 43 |
+
"static_batch_size": 1,
|
| 44 |
+
"static_sequence_length": 32,
|
| 45 |
+
"task": "fill-mask",
|
| 46 |
+
"tensor_parallel_size": 1
|
| 47 |
+
},
|
| 48 |
+
"num_attention_heads": 6,
|
| 49 |
+
"num_hidden_groups": 6,
|
| 50 |
+
"num_hidden_layers": 6,
|
| 51 |
+
"position_embedding_type": "absolute",
|
| 52 |
+
"type_vocab_size": 16,
|
| 53 |
+
"vocab_size": 30000
|
| 54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/9b69ad26e6071c069631.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "question-answering",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": false,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"start_logits",
|
| 42 |
+
"end_logits"
|
| 43 |
+
],
|
| 44 |
+
"static_batch_size": 1,
|
| 45 |
+
"static_sequence_length": 128,
|
| 46 |
+
"task": "question-answering",
|
| 47 |
+
"tensor_parallel_size": 1
|
| 48 |
+
},
|
| 49 |
+
"num_attention_heads": 6,
|
| 50 |
+
"num_hidden_groups": 6,
|
| 51 |
+
"num_hidden_layers": 6,
|
| 52 |
+
"position_embedding_type": "absolute",
|
| 53 |
+
"type_vocab_size": 16,
|
| 54 |
+
"vocab_size": 30000
|
| 55 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/aa7706c37f42f9b0efa0.json
ADDED
|
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "token-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": true,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"logits"
|
| 42 |
+
],
|
| 43 |
+
"static_batch_size": 1,
|
| 44 |
+
"static_sequence_length": 32,
|
| 45 |
+
"task": "token-classification",
|
| 46 |
+
"tensor_parallel_size": 1
|
| 47 |
+
},
|
| 48 |
+
"num_attention_heads": 6,
|
| 49 |
+
"num_hidden_groups": 6,
|
| 50 |
+
"num_hidden_layers": 6,
|
| 51 |
+
"position_embedding_type": "absolute",
|
| 52 |
+
"type_vocab_size": 16,
|
| 53 |
+
"vocab_size": 30000
|
| 54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/b5b638607d26526724c7.json
ADDED
|
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "text-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": false,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"logits"
|
| 42 |
+
],
|
| 43 |
+
"static_batch_size": 1,
|
| 44 |
+
"static_sequence_length": 128,
|
| 45 |
+
"task": "text-classification",
|
| 46 |
+
"tensor_parallel_size": 1
|
| 47 |
+
},
|
| 48 |
+
"num_attention_heads": 6,
|
| 49 |
+
"num_hidden_groups": 6,
|
| 50 |
+
"num_hidden_layers": 6,
|
| 51 |
+
"position_embedding_type": "absolute",
|
| 52 |
+
"type_vocab_size": 16,
|
| 53 |
+
"vocab_size": 30000
|
| 54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/ce96b3b9bef1f6cf0d93.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "question-answering",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": true,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"start_logits",
|
| 42 |
+
"end_logits"
|
| 43 |
+
],
|
| 44 |
+
"static_batch_size": 1,
|
| 45 |
+
"static_sequence_length": 32,
|
| 46 |
+
"task": "question-answering",
|
| 47 |
+
"tensor_parallel_size": 1
|
| 48 |
+
},
|
| 49 |
+
"num_attention_heads": 6,
|
| 50 |
+
"num_hidden_groups": 6,
|
| 51 |
+
"num_hidden_layers": 6,
|
| 52 |
+
"position_embedding_type": "absolute",
|
| 53 |
+
"type_vocab_size": 16,
|
| 54 |
+
"vocab_size": 30000
|
| 55 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/cf3a4b3035690a565ab1.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "feature-extraction",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": false,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"last_hidden_state",
|
| 42 |
+
"pooler_output"
|
| 43 |
+
],
|
| 44 |
+
"static_batch_size": 1,
|
| 45 |
+
"static_sequence_length": 32,
|
| 46 |
+
"task": "feature-extraction",
|
| 47 |
+
"tensor_parallel_size": 1
|
| 48 |
+
},
|
| 49 |
+
"num_attention_heads": 6,
|
| 50 |
+
"num_hidden_groups": 6,
|
| 51 |
+
"num_hidden_layers": 6,
|
| 52 |
+
"position_embedding_type": "absolute",
|
| 53 |
+
"type_vocab_size": 16,
|
| 54 |
+
"vocab_size": 30000
|
| 55 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/d2da3177c42e88297899.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "multiple-choice",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": false,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"logits"
|
| 42 |
+
],
|
| 43 |
+
"static_batch_size": 1,
|
| 44 |
+
"static_num_choices": 4,
|
| 45 |
+
"static_sequence_length": 128,
|
| 46 |
+
"task": "multiple-choice",
|
| 47 |
+
"tensor_parallel_size": 1
|
| 48 |
+
},
|
| 49 |
+
"num_attention_heads": 6,
|
| 50 |
+
"num_hidden_groups": 6,
|
| 51 |
+
"num_hidden_layers": 6,
|
| 52 |
+
"position_embedding_type": "absolute",
|
| 53 |
+
"type_vocab_size": 16,
|
| 54 |
+
"vocab_size": 30000
|
| 55 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/albert/hf-internal-testing/tiny-random-AlbertModel/e59dd1535caa6a29b4cc.json
ADDED
|
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-AlbertModel",
|
| 4 |
+
"_task": "text-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"AlbertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout_prob": 0.1,
|
| 10 |
+
"embedding_size": 128,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 36,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"inner_group_num": 1,
|
| 16 |
+
"intermediate_size": 37,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "albert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": true,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask",
|
| 33 |
+
"token_type_ids"
|
| 34 |
+
],
|
| 35 |
+
"int_dtype": "int64",
|
| 36 |
+
"model_type": "albert",
|
| 37 |
+
"optlevel": "2",
|
| 38 |
+
"output_attentions": false,
|
| 39 |
+
"output_hidden_states": false,
|
| 40 |
+
"output_names": [
|
| 41 |
+
"logits"
|
| 42 |
+
],
|
| 43 |
+
"static_batch_size": 1,
|
| 44 |
+
"static_sequence_length": 32,
|
| 45 |
+
"task": "text-classification",
|
| 46 |
+
"tensor_parallel_size": 1
|
| 47 |
+
},
|
| 48 |
+
"num_attention_heads": 6,
|
| 49 |
+
"num_hidden_groups": 6,
|
| 50 |
+
"num_hidden_layers": 6,
|
| 51 |
+
"position_embedding_type": "absolute",
|
| 52 |
+
"type_vocab_size": 16,
|
| 53 |
+
"vocab_size": 30000
|
| 54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/beit/hf-internal-testing/tiny-random-BeitForImageClassification/7b8399664c54026a03ff.json
ADDED
|
@@ -0,0 +1,90 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BeitForImageClassification",
|
| 4 |
+
"_task": "image-classification",
|
| 5 |
+
"add_fpn": false,
|
| 6 |
+
"architectures": [
|
| 7 |
+
"BeitForImageClassification"
|
| 8 |
+
],
|
| 9 |
+
"attention_probs_dropout_prob": 0.1,
|
| 10 |
+
"auxiliary_channels": 256,
|
| 11 |
+
"auxiliary_concat_input": false,
|
| 12 |
+
"auxiliary_loss_weight": 0.4,
|
| 13 |
+
"auxiliary_num_convs": 1,
|
| 14 |
+
"drop_path_rate": 0.1,
|
| 15 |
+
"hidden_act": "gelu",
|
| 16 |
+
"hidden_dropout_prob": 0.1,
|
| 17 |
+
"hidden_size": 32,
|
| 18 |
+
"image_size": 30,
|
| 19 |
+
"initializer_range": 0.02,
|
| 20 |
+
"intermediate_size": 37,
|
| 21 |
+
"layer_norm_eps": 1e-12,
|
| 22 |
+
"layer_scale_init_value": 0.1,
|
| 23 |
+
"model_type": "beit",
|
| 24 |
+
"neuron": {
|
| 25 |
+
"auto_cast": null,
|
| 26 |
+
"auto_cast_type": null,
|
| 27 |
+
"compiler_type": "neuronx-cc",
|
| 28 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 29 |
+
"disable_fallback": false,
|
| 30 |
+
"disable_fast_relayout": false,
|
| 31 |
+
"dynamic_batch_size": true,
|
| 32 |
+
"float_dtype": "fp32",
|
| 33 |
+
"inline_weights_to_neff": true,
|
| 34 |
+
"input_names": [
|
| 35 |
+
"pixel_values"
|
| 36 |
+
],
|
| 37 |
+
"int_dtype": "int64",
|
| 38 |
+
"model_type": "beit",
|
| 39 |
+
"optlevel": "2",
|
| 40 |
+
"output_attentions": false,
|
| 41 |
+
"output_hidden_states": false,
|
| 42 |
+
"output_names": [
|
| 43 |
+
"logits"
|
| 44 |
+
],
|
| 45 |
+
"static_batch_size": 1,
|
| 46 |
+
"static_image_size": 30,
|
| 47 |
+
"static_num_channels": 3,
|
| 48 |
+
"static_patch_size": 2,
|
| 49 |
+
"task": "image-classification",
|
| 50 |
+
"tensor_parallel_size": 1
|
| 51 |
+
},
|
| 52 |
+
"num_attention_heads": 4,
|
| 53 |
+
"num_channels": 3,
|
| 54 |
+
"num_hidden_layers": 4,
|
| 55 |
+
"out_features": [
|
| 56 |
+
"stem",
|
| 57 |
+
"stage1",
|
| 58 |
+
"stage2",
|
| 59 |
+
"stage3"
|
| 60 |
+
],
|
| 61 |
+
"out_indices": [
|
| 62 |
+
0,
|
| 63 |
+
1,
|
| 64 |
+
2,
|
| 65 |
+
3
|
| 66 |
+
],
|
| 67 |
+
"patch_size": 2,
|
| 68 |
+
"pool_scales": [
|
| 69 |
+
1,
|
| 70 |
+
2,
|
| 71 |
+
3,
|
| 72 |
+
6
|
| 73 |
+
],
|
| 74 |
+
"reshape_hidden_states": true,
|
| 75 |
+
"semantic_loss_ignore_index": 255,
|
| 76 |
+
"stage_names": [
|
| 77 |
+
"stem",
|
| 78 |
+
"stage1",
|
| 79 |
+
"stage2",
|
| 80 |
+
"stage3",
|
| 81 |
+
"stage4"
|
| 82 |
+
],
|
| 83 |
+
"use_absolute_position_embeddings": false,
|
| 84 |
+
"use_auxiliary_head": true,
|
| 85 |
+
"use_mask_token": false,
|
| 86 |
+
"use_mean_pooling": true,
|
| 87 |
+
"use_relative_position_bias": false,
|
| 88 |
+
"use_shared_relative_position_bias": false,
|
| 89 |
+
"vocab_size": 100
|
| 90 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/beit/hf-internal-testing/tiny-random-BeitForImageClassification/8eea34f80bdd528f4c47.json
ADDED
|
@@ -0,0 +1,90 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BeitForImageClassification",
|
| 4 |
+
"_task": "image-classification",
|
| 5 |
+
"add_fpn": false,
|
| 6 |
+
"architectures": [
|
| 7 |
+
"BeitForImageClassification"
|
| 8 |
+
],
|
| 9 |
+
"attention_probs_dropout_prob": 0.1,
|
| 10 |
+
"auxiliary_channels": 256,
|
| 11 |
+
"auxiliary_concat_input": false,
|
| 12 |
+
"auxiliary_loss_weight": 0.4,
|
| 13 |
+
"auxiliary_num_convs": 1,
|
| 14 |
+
"drop_path_rate": 0.1,
|
| 15 |
+
"hidden_act": "gelu",
|
| 16 |
+
"hidden_dropout_prob": 0.1,
|
| 17 |
+
"hidden_size": 32,
|
| 18 |
+
"image_size": 30,
|
| 19 |
+
"initializer_range": 0.02,
|
| 20 |
+
"intermediate_size": 37,
|
| 21 |
+
"layer_norm_eps": 1e-12,
|
| 22 |
+
"layer_scale_init_value": 0.1,
|
| 23 |
+
"model_type": "beit",
|
| 24 |
+
"neuron": {
|
| 25 |
+
"auto_cast": null,
|
| 26 |
+
"auto_cast_type": null,
|
| 27 |
+
"compiler_type": "neuronx-cc",
|
| 28 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 29 |
+
"disable_fallback": false,
|
| 30 |
+
"disable_fast_relayout": false,
|
| 31 |
+
"dynamic_batch_size": false,
|
| 32 |
+
"float_dtype": "fp32",
|
| 33 |
+
"inline_weights_to_neff": true,
|
| 34 |
+
"input_names": [
|
| 35 |
+
"pixel_values"
|
| 36 |
+
],
|
| 37 |
+
"int_dtype": "int64",
|
| 38 |
+
"model_type": "beit",
|
| 39 |
+
"optlevel": "2",
|
| 40 |
+
"output_attentions": false,
|
| 41 |
+
"output_hidden_states": false,
|
| 42 |
+
"output_names": [
|
| 43 |
+
"logits"
|
| 44 |
+
],
|
| 45 |
+
"static_batch_size": 1,
|
| 46 |
+
"static_image_size": 30,
|
| 47 |
+
"static_num_channels": 3,
|
| 48 |
+
"static_patch_size": 2,
|
| 49 |
+
"task": "image-classification",
|
| 50 |
+
"tensor_parallel_size": 1
|
| 51 |
+
},
|
| 52 |
+
"num_attention_heads": 4,
|
| 53 |
+
"num_channels": 3,
|
| 54 |
+
"num_hidden_layers": 4,
|
| 55 |
+
"out_features": [
|
| 56 |
+
"stem",
|
| 57 |
+
"stage1",
|
| 58 |
+
"stage2",
|
| 59 |
+
"stage3"
|
| 60 |
+
],
|
| 61 |
+
"out_indices": [
|
| 62 |
+
0,
|
| 63 |
+
1,
|
| 64 |
+
2,
|
| 65 |
+
3
|
| 66 |
+
],
|
| 67 |
+
"patch_size": 2,
|
| 68 |
+
"pool_scales": [
|
| 69 |
+
1,
|
| 70 |
+
2,
|
| 71 |
+
3,
|
| 72 |
+
6
|
| 73 |
+
],
|
| 74 |
+
"reshape_hidden_states": true,
|
| 75 |
+
"semantic_loss_ignore_index": 255,
|
| 76 |
+
"stage_names": [
|
| 77 |
+
"stem",
|
| 78 |
+
"stage1",
|
| 79 |
+
"stage2",
|
| 80 |
+
"stage3",
|
| 81 |
+
"stage4"
|
| 82 |
+
],
|
| 83 |
+
"use_absolute_position_embeddings": false,
|
| 84 |
+
"use_auxiliary_head": true,
|
| 85 |
+
"use_mask_token": false,
|
| 86 |
+
"use_mean_pooling": true,
|
| 87 |
+
"use_relative_position_bias": false,
|
| 88 |
+
"use_shared_relative_position_bias": false,
|
| 89 |
+
"vocab_size": 100
|
| 90 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/Jingya/tiny-random-bert-remote-code/601076bf2990d898404b.json
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "Jingya/tiny-random-bert-remote-code",
|
| 4 |
+
"_task": "text-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": false,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"logits"
|
| 40 |
+
],
|
| 41 |
+
"static_batch_size": 1,
|
| 42 |
+
"static_sequence_length": 32,
|
| 43 |
+
"task": "text-classification",
|
| 44 |
+
"tensor_parallel_size": 1
|
| 45 |
+
},
|
| 46 |
+
"num_attention_heads": 4,
|
| 47 |
+
"num_hidden_layers": 5,
|
| 48 |
+
"position_embedding_type": "absolute",
|
| 49 |
+
"type_vocab_size": 16,
|
| 50 |
+
"use_cache": true,
|
| 51 |
+
"vocab_size": 1124
|
| 52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/fxmarty/tiny-bert-sst2-distilled-subfolder/d7d576d06e1491d72e5a.json
ADDED
|
@@ -0,0 +1,61 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "fxmarty/tiny-bert-sst2-distilled-subfolder",
|
| 4 |
+
"_task": "text-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertForSequenceClassification"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 128,
|
| 13 |
+
"id2label": {
|
| 14 |
+
"0": "negative",
|
| 15 |
+
"1": "positive"
|
| 16 |
+
},
|
| 17 |
+
"initializer_range": 0.02,
|
| 18 |
+
"intermediate_size": 512,
|
| 19 |
+
"label2id": {
|
| 20 |
+
"negative": "0",
|
| 21 |
+
"positive": "1"
|
| 22 |
+
},
|
| 23 |
+
"layer_norm_eps": 1e-12,
|
| 24 |
+
"max_position_embeddings": 512,
|
| 25 |
+
"model_type": "bert",
|
| 26 |
+
"neuron": {
|
| 27 |
+
"auto_cast": null,
|
| 28 |
+
"auto_cast_type": null,
|
| 29 |
+
"compiler_type": "neuronx-cc",
|
| 30 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 31 |
+
"disable_fallback": false,
|
| 32 |
+
"disable_fast_relayout": false,
|
| 33 |
+
"dynamic_batch_size": false,
|
| 34 |
+
"float_dtype": "fp32",
|
| 35 |
+
"inline_weights_to_neff": true,
|
| 36 |
+
"input_names": [
|
| 37 |
+
"input_ids",
|
| 38 |
+
"attention_mask",
|
| 39 |
+
"token_type_ids"
|
| 40 |
+
],
|
| 41 |
+
"int_dtype": "int64",
|
| 42 |
+
"model_type": "bert",
|
| 43 |
+
"optlevel": "2",
|
| 44 |
+
"output_attentions": false,
|
| 45 |
+
"output_hidden_states": false,
|
| 46 |
+
"output_names": [
|
| 47 |
+
"logits"
|
| 48 |
+
],
|
| 49 |
+
"static_batch_size": 1,
|
| 50 |
+
"static_sequence_length": 32,
|
| 51 |
+
"task": "text-classification",
|
| 52 |
+
"tensor_parallel_size": 1
|
| 53 |
+
},
|
| 54 |
+
"num_attention_heads": 2,
|
| 55 |
+
"num_hidden_layers": 2,
|
| 56 |
+
"position_embedding_type": "absolute",
|
| 57 |
+
"problem_type": "single_label_classification",
|
| 58 |
+
"type_vocab_size": 2,
|
| 59 |
+
"use_cache": true,
|
| 60 |
+
"vocab_size": 30522
|
| 61 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/07d9dac237105afed7b4.json
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "fill-mask",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": false,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"logits"
|
| 40 |
+
],
|
| 41 |
+
"static_batch_size": 1,
|
| 42 |
+
"static_sequence_length": 32,
|
| 43 |
+
"task": "fill-mask",
|
| 44 |
+
"tensor_parallel_size": 1
|
| 45 |
+
},
|
| 46 |
+
"num_attention_heads": 4,
|
| 47 |
+
"num_hidden_layers": 5,
|
| 48 |
+
"position_embedding_type": "absolute",
|
| 49 |
+
"type_vocab_size": 16,
|
| 50 |
+
"use_cache": true,
|
| 51 |
+
"vocab_size": 1124
|
| 52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/0d7dca7e1b02d11fa30b.json
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "text-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": false,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"logits"
|
| 40 |
+
],
|
| 41 |
+
"static_batch_size": 1,
|
| 42 |
+
"static_sequence_length": 32,
|
| 43 |
+
"task": "text-classification",
|
| 44 |
+
"tensor_parallel_size": 1
|
| 45 |
+
},
|
| 46 |
+
"num_attention_heads": 4,
|
| 47 |
+
"num_hidden_layers": 5,
|
| 48 |
+
"position_embedding_type": "absolute",
|
| 49 |
+
"type_vocab_size": 16,
|
| 50 |
+
"use_cache": true,
|
| 51 |
+
"vocab_size": 1124
|
| 52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/22ce2cce0b08d134021c.json
ADDED
|
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "multiple-choice",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": false,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"logits"
|
| 40 |
+
],
|
| 41 |
+
"static_batch_size": 1,
|
| 42 |
+
"static_num_choices": 4,
|
| 43 |
+
"static_sequence_length": 128,
|
| 44 |
+
"task": "multiple-choice",
|
| 45 |
+
"tensor_parallel_size": 1
|
| 46 |
+
},
|
| 47 |
+
"num_attention_heads": 4,
|
| 48 |
+
"num_hidden_layers": 5,
|
| 49 |
+
"position_embedding_type": "absolute",
|
| 50 |
+
"type_vocab_size": 16,
|
| 51 |
+
"use_cache": true,
|
| 52 |
+
"vocab_size": 1124
|
| 53 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/28bcefedc9caadd676ab.json
ADDED
|
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "feature-extraction",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": false,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"last_hidden_state",
|
| 40 |
+
"pooler_output"
|
| 41 |
+
],
|
| 42 |
+
"static_batch_size": 1,
|
| 43 |
+
"static_sequence_length": 128,
|
| 44 |
+
"task": "feature-extraction",
|
| 45 |
+
"tensor_parallel_size": 1
|
| 46 |
+
},
|
| 47 |
+
"num_attention_heads": 4,
|
| 48 |
+
"num_hidden_layers": 5,
|
| 49 |
+
"position_embedding_type": "absolute",
|
| 50 |
+
"type_vocab_size": 16,
|
| 51 |
+
"use_cache": true,
|
| 52 |
+
"vocab_size": 1124
|
| 53 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/3908bf519c210b434176.json
ADDED
|
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "feature-extraction",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": false,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"last_hidden_state",
|
| 40 |
+
"pooler_output"
|
| 41 |
+
],
|
| 42 |
+
"static_batch_size": 1,
|
| 43 |
+
"static_sequence_length": 32,
|
| 44 |
+
"task": "feature-extraction",
|
| 45 |
+
"tensor_parallel_size": 1
|
| 46 |
+
},
|
| 47 |
+
"num_attention_heads": 4,
|
| 48 |
+
"num_hidden_layers": 5,
|
| 49 |
+
"position_embedding_type": "absolute",
|
| 50 |
+
"type_vocab_size": 16,
|
| 51 |
+
"use_cache": true,
|
| 52 |
+
"vocab_size": 1124
|
| 53 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/5ead9d705b13f37e716b.json
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "text-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": false,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": false,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"logits"
|
| 40 |
+
],
|
| 41 |
+
"static_batch_size": 1,
|
| 42 |
+
"static_sequence_length": 32,
|
| 43 |
+
"task": "text-classification",
|
| 44 |
+
"tensor_parallel_size": 1
|
| 45 |
+
},
|
| 46 |
+
"num_attention_heads": 4,
|
| 47 |
+
"num_hidden_layers": 5,
|
| 48 |
+
"position_embedding_type": "absolute",
|
| 49 |
+
"type_vocab_size": 16,
|
| 50 |
+
"use_cache": true,
|
| 51 |
+
"vocab_size": 1124
|
| 52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/80c925bab2fcc5749b91.json
ADDED
|
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "question-answering",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": false,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"start_logits",
|
| 40 |
+
"end_logits"
|
| 41 |
+
],
|
| 42 |
+
"static_batch_size": 1,
|
| 43 |
+
"static_sequence_length": 128,
|
| 44 |
+
"task": "question-answering",
|
| 45 |
+
"tensor_parallel_size": 1
|
| 46 |
+
},
|
| 47 |
+
"num_attention_heads": 4,
|
| 48 |
+
"num_hidden_layers": 5,
|
| 49 |
+
"position_embedding_type": "absolute",
|
| 50 |
+
"type_vocab_size": 16,
|
| 51 |
+
"use_cache": true,
|
| 52 |
+
"vocab_size": 1124
|
| 53 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/92f51980d46489605055.json
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "text-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": false,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"logits"
|
| 40 |
+
],
|
| 41 |
+
"static_batch_size": 1,
|
| 42 |
+
"static_sequence_length": 128,
|
| 43 |
+
"task": "text-classification",
|
| 44 |
+
"tensor_parallel_size": 1
|
| 45 |
+
},
|
| 46 |
+
"num_attention_heads": 4,
|
| 47 |
+
"num_hidden_layers": 5,
|
| 48 |
+
"position_embedding_type": "absolute",
|
| 49 |
+
"type_vocab_size": 16,
|
| 50 |
+
"use_cache": true,
|
| 51 |
+
"vocab_size": 1124
|
| 52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/aeebf3f56cf9d0ed0250.json
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "token-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": false,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"logits"
|
| 40 |
+
],
|
| 41 |
+
"static_batch_size": 1,
|
| 42 |
+
"static_sequence_length": 32,
|
| 43 |
+
"task": "token-classification",
|
| 44 |
+
"tensor_parallel_size": 1
|
| 45 |
+
},
|
| 46 |
+
"num_attention_heads": 4,
|
| 47 |
+
"num_hidden_layers": 5,
|
| 48 |
+
"position_embedding_type": "absolute",
|
| 49 |
+
"type_vocab_size": 16,
|
| 50 |
+
"use_cache": true,
|
| 51 |
+
"vocab_size": 1124
|
| 52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/cfb94bae5629e275593f.json
ADDED
|
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "feature-extraction",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": true,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"last_hidden_state",
|
| 40 |
+
"pooler_output"
|
| 41 |
+
],
|
| 42 |
+
"static_batch_size": 1,
|
| 43 |
+
"static_sequence_length": 32,
|
| 44 |
+
"task": "feature-extraction",
|
| 45 |
+
"tensor_parallel_size": 1
|
| 46 |
+
},
|
| 47 |
+
"num_attention_heads": 4,
|
| 48 |
+
"num_hidden_layers": 5,
|
| 49 |
+
"position_embedding_type": "absolute",
|
| 50 |
+
"type_vocab_size": 16,
|
| 51 |
+
"use_cache": true,
|
| 52 |
+
"vocab_size": 1124
|
| 53 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e050716b5de372871d73.json
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "token-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": false,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"logits"
|
| 40 |
+
],
|
| 41 |
+
"static_batch_size": 1,
|
| 42 |
+
"static_sequence_length": 128,
|
| 43 |
+
"task": "token-classification",
|
| 44 |
+
"tensor_parallel_size": 1
|
| 45 |
+
},
|
| 46 |
+
"num_attention_heads": 4,
|
| 47 |
+
"num_hidden_layers": 5,
|
| 48 |
+
"position_embedding_type": "absolute",
|
| 49 |
+
"type_vocab_size": 16,
|
| 50 |
+
"use_cache": true,
|
| 51 |
+
"vocab_size": 1124
|
| 52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e0768f223c51e12fd868.json
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "fill-mask",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": true,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"logits"
|
| 40 |
+
],
|
| 41 |
+
"static_batch_size": 1,
|
| 42 |
+
"static_sequence_length": 32,
|
| 43 |
+
"task": "fill-mask",
|
| 44 |
+
"tensor_parallel_size": 1
|
| 45 |
+
},
|
| 46 |
+
"num_attention_heads": 4,
|
| 47 |
+
"num_hidden_layers": 5,
|
| 48 |
+
"position_embedding_type": "absolute",
|
| 49 |
+
"type_vocab_size": 16,
|
| 50 |
+
"use_cache": true,
|
| 51 |
+
"vocab_size": 1124
|
| 52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e2594a1f187f452902f7.json
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "fill-mask",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": false,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"logits"
|
| 40 |
+
],
|
| 41 |
+
"static_batch_size": 1,
|
| 42 |
+
"static_sequence_length": 128,
|
| 43 |
+
"task": "fill-mask",
|
| 44 |
+
"tensor_parallel_size": 1
|
| 45 |
+
},
|
| 46 |
+
"num_attention_heads": 4,
|
| 47 |
+
"num_hidden_layers": 5,
|
| 48 |
+
"position_embedding_type": "absolute",
|
| 49 |
+
"type_vocab_size": 16,
|
| 50 |
+
"use_cache": true,
|
| 51 |
+
"vocab_size": 1124
|
| 52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e4834fd951418b796374.json
ADDED
|
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "multiple-choice",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": true,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"logits"
|
| 40 |
+
],
|
| 41 |
+
"static_batch_size": 1,
|
| 42 |
+
"static_num_choices": 4,
|
| 43 |
+
"static_sequence_length": 128,
|
| 44 |
+
"task": "multiple-choice",
|
| 45 |
+
"tensor_parallel_size": 1
|
| 46 |
+
},
|
| 47 |
+
"num_attention_heads": 4,
|
| 48 |
+
"num_hidden_layers": 5,
|
| 49 |
+
"position_embedding_type": "absolute",
|
| 50 |
+
"type_vocab_size": 16,
|
| 51 |
+
"use_cache": true,
|
| 52 |
+
"vocab_size": 1124
|
| 53 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/e7e71e6beffbf701391b.json
ADDED
|
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "question-answering",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": false,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"start_logits",
|
| 40 |
+
"end_logits"
|
| 41 |
+
],
|
| 42 |
+
"static_batch_size": 1,
|
| 43 |
+
"static_sequence_length": 32,
|
| 44 |
+
"task": "question-answering",
|
| 45 |
+
"tensor_parallel_size": 1
|
| 46 |
+
},
|
| 47 |
+
"num_attention_heads": 4,
|
| 48 |
+
"num_hidden_layers": 5,
|
| 49 |
+
"position_embedding_type": "absolute",
|
| 50 |
+
"type_vocab_size": 16,
|
| 51 |
+
"use_cache": true,
|
| 52 |
+
"vocab_size": 1124
|
| 53 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/ea81a963f6aa67da9f09.json
ADDED
|
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "question-answering",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": true,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"start_logits",
|
| 40 |
+
"end_logits"
|
| 41 |
+
],
|
| 42 |
+
"static_batch_size": 1,
|
| 43 |
+
"static_sequence_length": 32,
|
| 44 |
+
"task": "question-answering",
|
| 45 |
+
"tensor_parallel_size": 1
|
| 46 |
+
},
|
| 47 |
+
"num_attention_heads": 4,
|
| 48 |
+
"num_hidden_layers": 5,
|
| 49 |
+
"position_embedding_type": "absolute",
|
| 50 |
+
"type_vocab_size": 16,
|
| 51 |
+
"use_cache": true,
|
| 52 |
+
"vocab_size": 1124
|
| 53 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/ef32dca934503ba9400c.json
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "token-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": true,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"logits"
|
| 40 |
+
],
|
| 41 |
+
"static_batch_size": 1,
|
| 42 |
+
"static_sequence_length": 32,
|
| 43 |
+
"task": "token-classification",
|
| 44 |
+
"tensor_parallel_size": 1
|
| 45 |
+
},
|
| 46 |
+
"num_attention_heads": 4,
|
| 47 |
+
"num_hidden_layers": 5,
|
| 48 |
+
"position_embedding_type": "absolute",
|
| 49 |
+
"type_vocab_size": 16,
|
| 50 |
+
"use_cache": true,
|
| 51 |
+
"vocab_size": 1124
|
| 52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/hf-internal-testing/tiny-random-BertModel/f15944a91bf873bc4059.json
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-BertModel",
|
| 4 |
+
"_task": "text-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 32,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 37,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"neuron": {
|
| 19 |
+
"auto_cast": null,
|
| 20 |
+
"auto_cast_type": null,
|
| 21 |
+
"compiler_type": "neuronx-cc",
|
| 22 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 23 |
+
"disable_fallback": false,
|
| 24 |
+
"disable_fast_relayout": false,
|
| 25 |
+
"dynamic_batch_size": true,
|
| 26 |
+
"float_dtype": "fp32",
|
| 27 |
+
"inline_weights_to_neff": true,
|
| 28 |
+
"input_names": [
|
| 29 |
+
"input_ids",
|
| 30 |
+
"attention_mask",
|
| 31 |
+
"token_type_ids"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "bert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"logits"
|
| 40 |
+
],
|
| 41 |
+
"static_batch_size": 1,
|
| 42 |
+
"static_sequence_length": 32,
|
| 43 |
+
"task": "text-classification",
|
| 44 |
+
"tensor_parallel_size": 1
|
| 45 |
+
},
|
| 46 |
+
"num_attention_heads": 4,
|
| 47 |
+
"num_hidden_layers": 5,
|
| 48 |
+
"position_embedding_type": "absolute",
|
| 49 |
+
"type_vocab_size": 16,
|
| 50 |
+
"use_cache": true,
|
| 51 |
+
"vocab_size": 1124
|
| 52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/sentence-transformers/all-MiniLM-L6-v2/b571d0d9ac9ad084fa8c.json
ADDED
|
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "sentence-transformers/all-MiniLM-L6-v2",
|
| 4 |
+
"_task": "feature-extraction",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"export_model_type": "transformer",
|
| 11 |
+
"gradient_checkpointing": false,
|
| 12 |
+
"hidden_act": "gelu",
|
| 13 |
+
"hidden_dropout_prob": 0.1,
|
| 14 |
+
"hidden_size": 384,
|
| 15 |
+
"initializer_range": 0.02,
|
| 16 |
+
"intermediate_size": 1536,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "bert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": false,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask"
|
| 33 |
+
],
|
| 34 |
+
"int_dtype": "int64",
|
| 35 |
+
"model_type": "transformer",
|
| 36 |
+
"optlevel": "2",
|
| 37 |
+
"output_attentions": false,
|
| 38 |
+
"output_hidden_states": false,
|
| 39 |
+
"output_names": [
|
| 40 |
+
"token_embeddings",
|
| 41 |
+
"sentence_embedding"
|
| 42 |
+
],
|
| 43 |
+
"static_batch_size": 1,
|
| 44 |
+
"static_sequence_length": 16,
|
| 45 |
+
"task": "feature-extraction",
|
| 46 |
+
"tensor_parallel_size": 1
|
| 47 |
+
},
|
| 48 |
+
"num_attention_heads": 12,
|
| 49 |
+
"num_hidden_layers": 6,
|
| 50 |
+
"position_embedding_type": "absolute",
|
| 51 |
+
"type_vocab_size": 2,
|
| 52 |
+
"use_cache": true,
|
| 53 |
+
"vocab_size": 30522
|
| 54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/bert/sentence-transformers/all-MiniLM-L6-v2/f99a0822ae493faf0bb5.json
ADDED
|
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "sentence-transformers/all-MiniLM-L6-v2",
|
| 4 |
+
"_task": "feature-extraction",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"BertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"export_model_type": "transformer",
|
| 11 |
+
"gradient_checkpointing": false,
|
| 12 |
+
"hidden_act": "gelu",
|
| 13 |
+
"hidden_dropout_prob": 0.1,
|
| 14 |
+
"hidden_size": 384,
|
| 15 |
+
"initializer_range": 0.02,
|
| 16 |
+
"intermediate_size": 1536,
|
| 17 |
+
"layer_norm_eps": 1e-12,
|
| 18 |
+
"max_position_embeddings": 512,
|
| 19 |
+
"model_type": "bert",
|
| 20 |
+
"neuron": {
|
| 21 |
+
"auto_cast": null,
|
| 22 |
+
"auto_cast_type": null,
|
| 23 |
+
"compiler_type": "neuronx-cc",
|
| 24 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 25 |
+
"disable_fallback": false,
|
| 26 |
+
"disable_fast_relayout": false,
|
| 27 |
+
"dynamic_batch_size": true,
|
| 28 |
+
"float_dtype": "fp32",
|
| 29 |
+
"inline_weights_to_neff": true,
|
| 30 |
+
"input_names": [
|
| 31 |
+
"input_ids",
|
| 32 |
+
"attention_mask"
|
| 33 |
+
],
|
| 34 |
+
"int_dtype": "int64",
|
| 35 |
+
"model_type": "transformer",
|
| 36 |
+
"optlevel": "2",
|
| 37 |
+
"output_attentions": false,
|
| 38 |
+
"output_hidden_states": false,
|
| 39 |
+
"output_names": [
|
| 40 |
+
"token_embeddings",
|
| 41 |
+
"sentence_embedding"
|
| 42 |
+
],
|
| 43 |
+
"static_batch_size": 1,
|
| 44 |
+
"static_sequence_length": 32,
|
| 45 |
+
"task": "feature-extraction",
|
| 46 |
+
"tensor_parallel_size": 1
|
| 47 |
+
},
|
| 48 |
+
"num_attention_heads": 12,
|
| 49 |
+
"num_hidden_layers": 6,
|
| 50 |
+
"position_embedding_type": "absolute",
|
| 51 |
+
"type_vocab_size": 2,
|
| 52 |
+
"use_cache": true,
|
| 53 |
+
"vocab_size": 30522
|
| 54 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/camembert/hf-internal-testing/tiny-random-camembert/16650c04744503a0af47.json
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-camembert",
|
| 4 |
+
"_task": "token-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"CamembertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"gradient_checkpointing": false,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 32,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"intermediate_size": 37,
|
| 16 |
+
"layer_norm_eps": 1e-12,
|
| 17 |
+
"max_position_embeddings": 512,
|
| 18 |
+
"model_type": "camembert",
|
| 19 |
+
"neuron": {
|
| 20 |
+
"auto_cast": null,
|
| 21 |
+
"auto_cast_type": null,
|
| 22 |
+
"compiler_type": "neuronx-cc",
|
| 23 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 24 |
+
"disable_fallback": false,
|
| 25 |
+
"disable_fast_relayout": false,
|
| 26 |
+
"dynamic_batch_size": false,
|
| 27 |
+
"float_dtype": "fp32",
|
| 28 |
+
"inline_weights_to_neff": true,
|
| 29 |
+
"input_names": [
|
| 30 |
+
"input_ids",
|
| 31 |
+
"attention_mask"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "camembert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"logits"
|
| 40 |
+
],
|
| 41 |
+
"static_batch_size": 1,
|
| 42 |
+
"static_sequence_length": 32,
|
| 43 |
+
"task": "token-classification",
|
| 44 |
+
"tensor_parallel_size": 1
|
| 45 |
+
},
|
| 46 |
+
"num_attention_heads": 4,
|
| 47 |
+
"num_hidden_layers": 5,
|
| 48 |
+
"position_embedding_type": "absolute",
|
| 49 |
+
"type_vocab_size": 16,
|
| 50 |
+
"use_cache": true,
|
| 51 |
+
"vocab_size": 1000
|
| 52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/camembert/hf-internal-testing/tiny-random-camembert/3d5fe21de242b8b602d5.json
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-camembert",
|
| 4 |
+
"_task": "fill-mask",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"CamembertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"gradient_checkpointing": false,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 32,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"intermediate_size": 37,
|
| 16 |
+
"layer_norm_eps": 1e-12,
|
| 17 |
+
"max_position_embeddings": 512,
|
| 18 |
+
"model_type": "camembert",
|
| 19 |
+
"neuron": {
|
| 20 |
+
"auto_cast": null,
|
| 21 |
+
"auto_cast_type": null,
|
| 22 |
+
"compiler_type": "neuronx-cc",
|
| 23 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 24 |
+
"disable_fallback": false,
|
| 25 |
+
"disable_fast_relayout": false,
|
| 26 |
+
"dynamic_batch_size": true,
|
| 27 |
+
"float_dtype": "fp32",
|
| 28 |
+
"inline_weights_to_neff": true,
|
| 29 |
+
"input_names": [
|
| 30 |
+
"input_ids",
|
| 31 |
+
"attention_mask"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "camembert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"logits"
|
| 40 |
+
],
|
| 41 |
+
"static_batch_size": 1,
|
| 42 |
+
"static_sequence_length": 32,
|
| 43 |
+
"task": "fill-mask",
|
| 44 |
+
"tensor_parallel_size": 1
|
| 45 |
+
},
|
| 46 |
+
"num_attention_heads": 4,
|
| 47 |
+
"num_hidden_layers": 5,
|
| 48 |
+
"position_embedding_type": "absolute",
|
| 49 |
+
"type_vocab_size": 16,
|
| 50 |
+
"use_cache": true,
|
| 51 |
+
"vocab_size": 1000
|
| 52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/camembert/hf-internal-testing/tiny-random-camembert/4b4a4fbbe9d668bcf61e.json
ADDED
|
@@ -0,0 +1,52 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-camembert",
|
| 4 |
+
"_task": "token-classification",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"CamembertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"gradient_checkpointing": false,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 32,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"intermediate_size": 37,
|
| 16 |
+
"layer_norm_eps": 1e-12,
|
| 17 |
+
"max_position_embeddings": 512,
|
| 18 |
+
"model_type": "camembert",
|
| 19 |
+
"neuron": {
|
| 20 |
+
"auto_cast": null,
|
| 21 |
+
"auto_cast_type": null,
|
| 22 |
+
"compiler_type": "neuronx-cc",
|
| 23 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 24 |
+
"disable_fallback": false,
|
| 25 |
+
"disable_fast_relayout": false,
|
| 26 |
+
"dynamic_batch_size": true,
|
| 27 |
+
"float_dtype": "fp32",
|
| 28 |
+
"inline_weights_to_neff": true,
|
| 29 |
+
"input_names": [
|
| 30 |
+
"input_ids",
|
| 31 |
+
"attention_mask"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "camembert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"logits"
|
| 40 |
+
],
|
| 41 |
+
"static_batch_size": 1,
|
| 42 |
+
"static_sequence_length": 32,
|
| 43 |
+
"task": "token-classification",
|
| 44 |
+
"tensor_parallel_size": 1
|
| 45 |
+
},
|
| 46 |
+
"num_attention_heads": 4,
|
| 47 |
+
"num_hidden_layers": 5,
|
| 48 |
+
"position_embedding_type": "absolute",
|
| 49 |
+
"type_vocab_size": 16,
|
| 50 |
+
"use_cache": true,
|
| 51 |
+
"vocab_size": 1000
|
| 52 |
+
}
|
neuronxcc-2.19.8089.0+8ab9f450/0_REGISTRY/0.3.1.dev1/camembert/hf-internal-testing/tiny-random-camembert/5bca725791b646775427.json
ADDED
|
@@ -0,0 +1,53 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_entry_class": "SingleModelCacheEntry",
|
| 3 |
+
"_model_id": "hf-internal-testing/tiny-random-camembert",
|
| 4 |
+
"_task": "question-answering",
|
| 5 |
+
"architectures": [
|
| 6 |
+
"CamembertModel"
|
| 7 |
+
],
|
| 8 |
+
"attention_probs_dropout_prob": 0.1,
|
| 9 |
+
"classifier_dropout": null,
|
| 10 |
+
"gradient_checkpointing": false,
|
| 11 |
+
"hidden_act": "gelu",
|
| 12 |
+
"hidden_dropout_prob": 0.1,
|
| 13 |
+
"hidden_size": 32,
|
| 14 |
+
"initializer_range": 0.02,
|
| 15 |
+
"intermediate_size": 37,
|
| 16 |
+
"layer_norm_eps": 1e-12,
|
| 17 |
+
"max_position_embeddings": 512,
|
| 18 |
+
"model_type": "camembert",
|
| 19 |
+
"neuron": {
|
| 20 |
+
"auto_cast": null,
|
| 21 |
+
"auto_cast_type": null,
|
| 22 |
+
"compiler_type": "neuronx-cc",
|
| 23 |
+
"compiler_version": "2.19.8089.0+8ab9f450",
|
| 24 |
+
"disable_fallback": false,
|
| 25 |
+
"disable_fast_relayout": false,
|
| 26 |
+
"dynamic_batch_size": false,
|
| 27 |
+
"float_dtype": "fp32",
|
| 28 |
+
"inline_weights_to_neff": true,
|
| 29 |
+
"input_names": [
|
| 30 |
+
"input_ids",
|
| 31 |
+
"attention_mask"
|
| 32 |
+
],
|
| 33 |
+
"int_dtype": "int64",
|
| 34 |
+
"model_type": "camembert",
|
| 35 |
+
"optlevel": "2",
|
| 36 |
+
"output_attentions": false,
|
| 37 |
+
"output_hidden_states": false,
|
| 38 |
+
"output_names": [
|
| 39 |
+
"start_logits",
|
| 40 |
+
"end_logits"
|
| 41 |
+
],
|
| 42 |
+
"static_batch_size": 1,
|
| 43 |
+
"static_sequence_length": 128,
|
| 44 |
+
"task": "question-answering",
|
| 45 |
+
"tensor_parallel_size": 1
|
| 46 |
+
},
|
| 47 |
+
"num_attention_heads": 4,
|
| 48 |
+
"num_hidden_layers": 5,
|
| 49 |
+
"position_embedding_type": "absolute",
|
| 50 |
+
"type_vocab_size": 16,
|
| 51 |
+
"use_cache": true,
|
| 52 |
+
"vocab_size": 1000
|
| 53 |
+
}
|