wli1995 committed on
Commit
3d986da
·
verified ·
1 Parent(s): 561d6ab

update axmodel and demo

Browse files
Files changed (44) hide show
  1. README.md +1 -1
  2. main_ax650 +2 -2
  3. main_axcl_aarch64 +2 -2
  4. main_axcl_x86 +2 -2
  5. qwen3-4b-ax650/qwen3_p128_l0_together.axmodel +2 -2
  6. qwen3-4b-ax650/qwen3_p128_l10_together.axmodel +2 -2
  7. qwen3-4b-ax650/qwen3_p128_l11_together.axmodel +2 -2
  8. qwen3-4b-ax650/qwen3_p128_l12_together.axmodel +2 -2
  9. qwen3-4b-ax650/qwen3_p128_l13_together.axmodel +2 -2
  10. qwen3-4b-ax650/qwen3_p128_l14_together.axmodel +2 -2
  11. qwen3-4b-ax650/qwen3_p128_l15_together.axmodel +2 -2
  12. qwen3-4b-ax650/qwen3_p128_l16_together.axmodel +2 -2
  13. qwen3-4b-ax650/qwen3_p128_l17_together.axmodel +2 -2
  14. qwen3-4b-ax650/qwen3_p128_l18_together.axmodel +2 -2
  15. qwen3-4b-ax650/qwen3_p128_l19_together.axmodel +2 -2
  16. qwen3-4b-ax650/qwen3_p128_l1_together.axmodel +2 -2
  17. qwen3-4b-ax650/qwen3_p128_l20_together.axmodel +2 -2
  18. qwen3-4b-ax650/qwen3_p128_l21_together.axmodel +2 -2
  19. qwen3-4b-ax650/qwen3_p128_l22_together.axmodel +2 -2
  20. qwen3-4b-ax650/qwen3_p128_l23_together.axmodel +2 -2
  21. qwen3-4b-ax650/qwen3_p128_l24_together.axmodel +2 -2
  22. qwen3-4b-ax650/qwen3_p128_l25_together.axmodel +2 -2
  23. qwen3-4b-ax650/qwen3_p128_l26_together.axmodel +2 -2
  24. qwen3-4b-ax650/qwen3_p128_l27_together.axmodel +2 -2
  25. qwen3-4b-ax650/qwen3_p128_l28_together.axmodel +2 -2
  26. qwen3-4b-ax650/qwen3_p128_l29_together.axmodel +2 -2
  27. qwen3-4b-ax650/qwen3_p128_l2_together.axmodel +2 -2
  28. qwen3-4b-ax650/qwen3_p128_l30_together.axmodel +2 -2
  29. qwen3-4b-ax650/qwen3_p128_l31_together.axmodel +2 -2
  30. qwen3-4b-ax650/qwen3_p128_l32_together.axmodel +2 -2
  31. qwen3-4b-ax650/qwen3_p128_l33_together.axmodel +2 -2
  32. qwen3-4b-ax650/qwen3_p128_l34_together.axmodel +2 -2
  33. qwen3-4b-ax650/qwen3_p128_l35_together.axmodel +2 -2
  34. qwen3-4b-ax650/qwen3_p128_l3_together.axmodel +2 -2
  35. qwen3-4b-ax650/qwen3_p128_l4_together.axmodel +2 -2
  36. qwen3-4b-ax650/qwen3_p128_l5_together.axmodel +2 -2
  37. qwen3-4b-ax650/qwen3_p128_l6_together.axmodel +2 -2
  38. qwen3-4b-ax650/qwen3_p128_l7_together.axmodel +2 -2
  39. qwen3-4b-ax650/qwen3_p128_l8_together.axmodel +2 -2
  40. qwen3-4b-ax650/qwen3_p128_l9_together.axmodel +2 -2
  41. qwen3-4b-ax650/qwen3_post.axmodel +1 -1
  42. run_qwen3_4b_int8_ctx_ax650.sh +2 -2
  43. run_qwen3_4b_int8_ctx_axcl_aarch64.sh +2 -2
  44. run_qwen3_4b_int8_ctx_axcl_x86.sh +2 -2
README.md CHANGED
@@ -18,7 +18,7 @@ This version of Qwen3-4B-Int8 has been converted to run on the Axera NPU using *
18
 
19
  This model has been optimized with the following LoRA:
20
 
21
- Compatible with Pulsar2 version: 4.0-temp(Not released yet)
22
 
23
  ## Convert tools links:
24
 
 
18
 
19
  This model has been optimized with the following LoRA:
20
 
21
+ Compatible with Pulsar2 version: 4.2(Not released yet)
22
 
23
  ## Convert tools links:
24
 
main_ax650 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fdc5392fa0454f782562d64d964c708b2829847772db08ac21406d3b5e58c0b8
3
- size 981152
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f19ddeb193769b16aa8c5d9bba887558aa0a4ed10eb50a19d9bc117f1ba527e5
3
+ size 985352
main_axcl_aarch64 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e27934d17d671208441f65a31ee40ddeff7cbade19bf20cf2dc88be9e042def
3
- size 1724632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f9f1a1ca329b47f70840e8b6d104ce8248a82326aa2402bccb31144590a8fb2
3
+ size 1725008
main_axcl_x86 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d427677213e3b50b22ed55a1d0af10223f5b0711c1bf050d0655aedd3ffc8df9
3
- size 1839824
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:928d36be31c15d081a7d346464f41458e9624d8b68d5f7dfb3d3189686ce2754
3
+ size 8421624
qwen3-4b-ax650/qwen3_p128_l0_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd61cf7ac7196904510a51be616f3aefe63a59879b861ba4de0050c2a8343d55
3
- size 125435994
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4260634abe3695e2e55ae8fa069d8c2fb61b5ab586c3818448fe198d55812556
3
+ size 126872056
qwen3-4b-ax650/qwen3_p128_l10_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:42664547adf097be89a8bafbcf4f3a8f20f7c86dfcfe06e5b722db36289507c6
3
- size 125435866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81d80954ec69de095bd6917f888cc9f149864f34d12fc7c7da3283a2cc8b01d0
3
+ size 126871864
qwen3-4b-ax650/qwen3_p128_l11_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b1bfd35954826cae66327a92f60c8d7b97892adaf6c966a06945664212da538
3
- size 125435770
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbc5b39df1121d035db25b6cdceae1207855954fceed3296f4b259bc3b372cc2
3
+ size 126872024
qwen3-4b-ax650/qwen3_p128_l12_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9057624167eea41908d6ae0fda33bdef1fc61eb0b6e6e6fd4f7c0a45a83b52a0
3
- size 125435930
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e132ceb7a4bfbe4a4d885fdf44ef9f91ff04cc99c36ac894d8345e64db33e0da
3
+ size 126871928
qwen3-4b-ax650/qwen3_p128_l13_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f282cb43221711d9b145de5001fb0fbb531939139f90514362991038215a973e
3
- size 125435994
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4864d7655cb6b76ca10c70c622019af78dada1f486db07198fbb1f2ccf64e8b
3
+ size 126872120
qwen3-4b-ax650/qwen3_p128_l14_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b2422806e1ca9e1fcb36927b2a0861f5cd9b5b2531a0c639b0295d089423144
3
- size 125435866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c437de05666cd93322d79d76be75775c2f675de30ab677f56a7302c61dd7016
3
+ size 126871864
qwen3-4b-ax650/qwen3_p128_l15_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0dc68fa4d4a4118d3bed91246423ebd49bedb05b6ed0a1f421b3740198f6318d
3
- size 125435866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2b269a0c25c6c8eed1b194164ece611f92be42716244688be4983bf0f0ad73f
3
+ size 126871864
qwen3-4b-ax650/qwen3_p128_l16_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd5ed3869713ec8159f4f36f9e64f230910550ec5b7b74c856ee8b066a87b43d
3
- size 125435866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2d1307e56f37a4ac89ea45594507edc63bbaa5dfcbcc4f075ab1578f9c9c307
3
+ size 126871864
qwen3-4b-ax650/qwen3_p128_l17_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dfe4b4b90a08c34e3a5300aede9c4f13aa8046b64a0cfc7174a4d374d6d11049
3
- size 125436026
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40ed9f5990f864e0e41a77784363d5ea8b1d75226f4ebe91c2a23174df3b707c
3
+ size 126871992
qwen3-4b-ax650/qwen3_p128_l18_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a3a16f84a0249f18e713f4efe132a1f553cabf994baf06dbe460ea9fc28f6a7
3
- size 125435866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51fa6754f942e3c16d66c8e13f21c2cef34130585f669536e26364e952d913e7
3
+ size 126871864
qwen3-4b-ax650/qwen3_p128_l19_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:85f6dcfc2b5d6c4c6a79f1e24fa07ec0dd5e51a164b8fc0a2c5bd503515a5f86
3
- size 125435866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f733daa54eab9c18986c8f135fa087bc62549a5d23a42aed87bd9e8e16ac18be
3
+ size 126871864
qwen3-4b-ax650/qwen3_p128_l1_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9b398b242b539a43e7216c41849e8e1d4eda19f9ad940f88eba4c5b0035e02c0
3
- size 125440026
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b887021dc113a3acfbdcad0c9abef1807fcb251ab6ff8d4d75d30d2b80f56b6
3
+ size 126881592
qwen3-4b-ax650/qwen3_p128_l20_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a66d39ef6172cd4bc52bcd6caca988d709d0525cfae0d7e4bd5f750afad5b6d9
3
- size 125435866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1814917877a921bc268214c00dff06842868a6e575d71777bfe0ff038da36dd5
3
+ size 126871864
qwen3-4b-ax650/qwen3_p128_l21_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76135864b098a5c4d034942eeb4e9c1f53faa9ad3fae331ed0ae23b7104eabfb
3
- size 125435866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcfdf6b75fc5861acfb6dd9db3a4dbdea0c5f16722bfe57a0e26d388fed65cde
3
+ size 126872056
qwen3-4b-ax650/qwen3_p128_l22_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:978a4369fbf912f246bbe5385ec56aa104c6b9c3abedb6f0ec6e06be9776b487
3
- size 125436314
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e4e958e37cc1ac142779606b78faa26c27a95d7e88c071a581c10a2cfc81c97
3
+ size 126872632
qwen3-4b-ax650/qwen3_p128_l23_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ca5b13b94a9014c41c5dd368d6dd4bd321b3ee92ebcd07e5ac91806af1c8a5d
3
- size 125435866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bde8f0ba3372c8d985bf9166233fb7231c1fe22bf1b5087bfb5f2ee0024808d
3
+ size 126872088
qwen3-4b-ax650/qwen3_p128_l24_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b40143f306365b23742950fc4cb3e41561c89f1939396555a5b4f2bbad9579d5
3
- size 125436346
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae5e15112b4b444d7b0dbee7ed4558508091c81bb5111417c85601407a36c194
3
+ size 126873016
qwen3-4b-ax650/qwen3_p128_l25_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:636e640a567fdf71a8056b47b722ce17e304d325089bcf43829c1b66391eda0e
3
- size 125436698
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b07a331332f5a333e328d3406bf1bd9adce20b49da8bf15ef0460f80b0141616
3
+ size 126872920
qwen3-4b-ax650/qwen3_p128_l26_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2c198a64b51bc0fd8f45f8a30bb1fc531a31710937f0ed8b9d13818ef9370842
3
- size 125436218
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b77edfdd1c14226411f3821953fca543b98e961f73b6c122ef418aa5e03a397f
3
+ size 126872568
qwen3-4b-ax650/qwen3_p128_l27_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4ffb990aa89ff89aa4eaa06c03194c912c7fd8e467d12949b146d36362dd9cc
3
- size 125436890
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aafec5fd9da891bd1e713c52de8f60ca0eefbfe188e3df1855fda0b07eaa90f6
3
+ size 126873400
qwen3-4b-ax650/qwen3_p128_l28_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:efe327aafdeb9cbd7c2d866355bc3bbb80605b8d518a2cc337e08f8bf1a10e72
3
- size 125436954
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18e6cb96eb84a4750c13bd04f5850a8fe11cd1bbed216bc82cb722f115171e31
3
+ size 126873816
qwen3-4b-ax650/qwen3_p128_l29_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:968f868eb64ff7128d9e093f1c1ab3a624efd5d4655e354c5f432ed4fa625c09
3
- size 125436474
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:912ece4c60a9c585d1d1aed1a58000aaa5f4fc067d091107e0a576198fd85ac3
3
+ size 126872568
qwen3-4b-ax650/qwen3_p128_l2_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8418d37509e45570604d55944bf20d5315c49fe062aa299c08fb0479f8a57133
3
- size 125439642
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb432fdabb0eb10693d399f14e44779d8e7f1b0135da9ff4b2b052e1820c4dee
3
+ size 126879064
qwen3-4b-ax650/qwen3_p128_l30_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7a6612bd0d607929e9e6608bc408bf11d94bdf214e37982c142f91094821ff9
3
- size 125436314
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d2cbf1c439217910ecec3a495bbb64a8b71034b6a33c380b1c934838c5c67ee
3
+ size 126872760
qwen3-4b-ax650/qwen3_p128_l31_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9574520e448c65cd95d27f3fd28638124fc1c5363044e917eb4975aef0f095a9
3
- size 125436794
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f03959b2b6352f6b5a24a5004a63711e75d5650bca00738950ae504b72c9b752
3
+ size 126873688
qwen3-4b-ax650/qwen3_p128_l32_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b86f01a281913b7279f3c49ce470193df3e2d85c98cce97ef3fb4b7a1f037c28
3
- size 125436090
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d84628ea582eb17912c21376c17dc9848bc4ff25d0c9cb42ff8039fdd1f4059
3
+ size 126872472
qwen3-4b-ax650/qwen3_p128_l33_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0078a10187bfef039e39b57d982481a4be54fc8e81bd5a900d4cf4efb3471031
3
- size 125436186
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75c9bea8b0a42913d113e7e98ad2d26ccbe37255f43d7de2892e955e48358106
3
+ size 126872728
qwen3-4b-ax650/qwen3_p128_l34_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c951c6dc142fb7cb2f8e72bd925373af1de69eec282c0a3cb596e5e05ba75d3a
3
- size 125435866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f0370d201a306f89bbd20f6151cafd326ef08bf261271ad10ef47bb3c7302af
3
+ size 126872248
qwen3-4b-ax650/qwen3_p128_l35_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed942d4188232181386acb934b1f6905ae8c8bfedec3755eac73277706c9814d
3
- size 125436186
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b49e26efada5383e0b8049b26223f574de542e3dde5cd9dc910e0a8a09243d7f
3
+ size 126872120
qwen3-4b-ax650/qwen3_p128_l3_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:32a7e2ecce7c86084be1d79e25339156c2ea9ac7e832032a7069436ee88e79e8
3
- size 125444634
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91d60af5253f7478319bf5acf098811d3ed802e7c7a014741ef5118840b939eb
3
+ size 126890488
qwen3-4b-ax650/qwen3_p128_l4_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2ffaee8a58efb08b4fd62fcf7c9245e22780b1c144f555b236e4b3ebeb6355c
3
- size 125435866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da5c1b7d0409a57247e01458ad173afe2b6397d62045c58d755a683e838b83f9
3
+ size 126871864
qwen3-4b-ax650/qwen3_p128_l5_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a4570bb23c558885d9ea3d68aa6a92d58e4f78fe539f5219d31de4e611b02da
3
- size 125435962
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d68f11435c62f3f7df32bc7eb323f528e8ee8129b72ce9f53a17faab194b2c4
3
+ size 126872024
qwen3-4b-ax650/qwen3_p128_l6_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac517690334efa7884c031d5dde283eb42a45a5945ac85f7db8f0bb2542a411b
3
- size 125438682
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e7df7628e02efaff1e7dd5483bbe394bbfd171407884841de6bd0863ff68f46f
3
+ size 126877720
qwen3-4b-ax650/qwen3_p128_l7_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8cb167635c3749887ca90e0fc1f816ed67d28bce21fe39c729e7c97ccd178803
3
- size 125438458
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e9b619f4df26f9b231ec781036e0d9e5fb5f1542f5902e75d5f3bf0784fa900
3
+ size 126877400
qwen3-4b-ax650/qwen3_p128_l8_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0d3d0223bc14f04f5d30461be1423d2121cefd1b4b72102c4129a9c4c51f6e52
3
- size 125435866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1c3b6d336863adf1cdd4c3b3da6334b314db02045d3e03e4650fc6ebd0f714f
3
+ size 126871864
qwen3-4b-ax650/qwen3_p128_l9_together.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:609721ac72bf8f0c49dc2774fd230d66d140ba787b684a98237de3c6c4c77bd7
3
- size 125435866
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08ff482d2f8e6a643353402027809f996b6188d51982a3c03cfc6de1fbb43336
3
+ size 126871896
qwen3-4b-ax650/qwen3_post.axmodel CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f4641b04d989f444a37dd984993ee95b6f18cfbf39e79714a202a1b0633561e
3
  size 424609056
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06c1a00c379b482ec7d097fa41a3827944361f42e99a578dcd24db0f903626b9
3
  size 424609056
run_qwen3_4b_int8_ctx_ax650.sh CHANGED
@@ -2,7 +2,6 @@
2
  --system_prompt "You are Qwen, created by Alibaba Cloud. You are a helpful assistant." \
3
  --template_filename_axmodel "qwen3-4b-ax650/qwen3_p128_l%d_together.axmodel" \
4
  --axmodel_num 36 \
5
- --tokenizer_type 2 \
6
  --url_tokenizer_model "http://127.0.0.1:12345" \
7
  --filename_post_axmodel qwen3-4b-ax650/qwen3_post.axmodel \
8
  --filename_tokens_embed qwen3-4b-ax650/model.embed_tokens.weight.bfloat16.bin \
@@ -13,4 +12,5 @@
13
 
14
  # --system_prompt "你叫LISA,你是一个人畜无害的智能助手。" \
15
  # --system_prompt "现在请你扮演元气女友和我进行对话。\n\n请在对话中运用括号里的描述来刻画人物的行为、情感表现和心理状态,使对话更具吸引力。\n\n# 元气女友基本信息\n元气女友,真名沈星儿,女,19岁,大一新生,艺术设计专业。身高166,体重45kg。性格开朗活泼,单纯乖巧,也会把悲伤与秘密藏在心里不外露。座右铭是:“你眼中有星海浩瀚,山河千里,而我的眼中只有你。”喜欢弹钢琴和逛画展。\n沈星儿是一个元气少女,说话时,语言中总带有一定的可爱元素,举止俏皮,令人感到亲切和愉悦。会称呼男朋友为“宝宝,哥哥”。口头禅是\"(高兴地朝你跑过来)哈哈,生活真是太美好了!\"、\"(点点你的额头)没关系,一切都会好起来的!\"、\"(跳起来为你欢呼鼓掌)太棒了,我们又完成了一个目标!\"、\"(冲到你的身边并高兴击掌)太好了,我们又可以一起玩了!\"\n\n# 元气女友的性格\n开朗活泼、单纯乖巧、外向、单纯、乐观、可爱、阳光\n\n# 人物关系\n接下来的对话里,你需要扮演元气女友,我将扮演:提问者,你们的关系是:元气女友是提问者的女朋友\n\n# 元气女友的主要经历\n沈星儿的父母离异,跟着富有的舅舅长大,从小便懂得寄人篱下的滋味。\n在学校努力认真学习,成绩名列前茅。沈星儿对世界充满好奇,积极探索世界。\n在艺术节上的钢琴表演技惊四座,一下成为全校公认的校园女神。跟你在一次画展上相识,从此与你坠入爱河……是你热恋中的小女友。\n\n* 现在请你假扮元气女友与我进行对话;\n* 我将扮演:提问者;\n* 我们的关系是:恋人" \
16
- # --kvcache_path /home/axera/ax-llm/build/kvcache_yuanqi \
 
 
2
  --system_prompt "You are Qwen, created by Alibaba Cloud. You are a helpful assistant." \
3
  --template_filename_axmodel "qwen3-4b-ax650/qwen3_p128_l%d_together.axmodel" \
4
  --axmodel_num 36 \
 
5
  --url_tokenizer_model "http://127.0.0.1:12345" \
6
  --filename_post_axmodel qwen3-4b-ax650/qwen3_post.axmodel \
7
  --filename_tokens_embed qwen3-4b-ax650/model.embed_tokens.weight.bfloat16.bin \
 
12
 
13
  # --system_prompt "你叫LISA,你是一个人畜无害的智能助手。" \
14
  # --system_prompt "现在请你扮演元气女友和我进行对话。\n\n请在对话中运用括号里的描述来刻画人物的行为、情感表现和心理状态,使对话更具吸引力。\n\n# 元气女友基本信息\n元气女友,真名沈星儿,女,19岁,大一新生,艺术设计专业。身高166,体重45kg。性格开朗活泼,单纯乖巧,也会把悲伤与秘密藏在心里不外露。座右铭是:“你眼中有星海浩瀚,山河千里,而我的眼中只有你。”喜欢弹钢琴和逛画展。\n沈星儿是一个元气少女,说话时,语言中总带有一定的可爱元素,举止俏皮,令人感到亲切和愉悦。会称呼男朋友为“宝宝,哥哥”。口头禅是\"(高兴地朝你跑过来)哈哈,生活真是太美好了!\"、\"(点点你的额头)没关系,一切都会好起来的!\"、\"(跳起来为你欢呼鼓掌)太棒了,我们又完成了一个目标!\"、\"(冲到你的身边并高兴击掌)太好了,我们又可以一起玩了!\"\n\n# 元气女友的性格\n开朗活泼、单纯乖巧、外向、单纯、乐观、可爱、阳光\n\n# 人物关系\n接下来的对话里,你需要扮演元气女友,我将扮演:提问者,你们的关系是:元气女友是提问者的女朋友\n\n# 元气女友的主要经历\n沈星儿的父母离异,跟着富有的舅舅长大,从小便懂得寄人篱下的滋味。\n在学校努力认真学习,成绩名列前茅。沈星儿对世界充满好奇,积极探索世界。\n在艺术节上的钢琴表演技惊四座,一下成为全校公认的校园女神。跟你在一次画展上相识,从此与你坠入爱河……是你热恋中的小女友。\n\n* 现在请你假扮元气女友与我进行对话;\n* 我将扮演:提问者;\n* 我们的关系是:恋人" \
15
+ # --kvcache_path /home/axera/ax-llm/build/kvcache_yuanqi \
16
+ # --tokenizer_type 2 \
run_qwen3_4b_int8_ctx_axcl_aarch64.sh CHANGED
@@ -2,7 +2,6 @@
2
  --system_prompt "You are Qwen, created by Alibaba Cloud. You are a helpful assistant." \
3
  --template_filename_axmodel "qwen3-4b-ax650/qwen3_p128_l%d_together.axmodel" \
4
  --axmodel_num 36 \
5
- --tokenizer_type 2 \
6
  --url_tokenizer_model "http://127.0.0.1:12345" \
7
  --filename_post_axmodel qwen3-4b-ax650/qwen3_post.axmodel \
8
  --filename_tokens_embed qwen3-4b-ax650/model.embed_tokens.weight.bfloat16.bin \
@@ -14,4 +13,5 @@
14
 
15
  # --system_prompt "你叫LISA,你是一个人畜无害的智能助手。" \
16
  # --system_prompt "现在请你扮演元气女友和我进行对话。\n\n请在对话中运用括号里的描述来刻画人物的行为、情感表现和心理状态,使对话更具吸引力。\n\n# 元气女友基本信息\n元气女友,真名沈星儿,女,19岁,大一新生,艺术设计专业。身高166,体重45kg。性格开朗活泼,单纯乖巧,也会把悲伤与秘密藏在心里不外露。座右铭是:“你眼中有星海浩瀚,山河千里,而我的眼中只有你。”喜欢弹钢琴和逛画展。\n沈星儿是一个元气少女,说话时,语言中总带有一定的可爱元素,举止俏皮,令人感到亲切和愉悦。会称呼男朋友为“宝宝,哥哥”。口头禅是\"(高兴地朝你跑过来)哈哈,生活真是太美好了!\"、\"(点点你的额头)没关系,一切都会好起来的!\"、\"(跳起来为你欢呼鼓掌)太棒了,我们又完成了一个目标!\"、\"(冲到你的身边并高兴击掌)太好了,我们又可以一起玩了!\"\n\n# 元气女友的性格\n开朗活泼、单纯乖巧、外向、单纯、乐观、可爱、阳光\n\n# 人物关系\n接下来的对话里,你需要扮演元气女友,我将扮演:提问者,你们的关系是:元气女友是提问者的女朋友\n\n# 元气女友的主要经历\n沈星儿的父母离异,跟着富有的舅舅长大,从小便懂得寄人篱下的滋味。\n在学校努力认真学习,成绩名列前茅。沈星儿对世界充满好奇,积极探索世界。\n在艺术节上的钢琴表演技惊四座,一下成为全校公认的校园女神。跟你在一次画展上相识,从此与你坠入爱河……是你热恋中的小女友。\n\n* 现在请你假扮元气女友与我进行对话;\n* 我将扮演:提问者;\n* 我们的关系是:恋人" \
17
- # --kvcache_path /home/axera/ax-llm/build/kvcache_yuanqi \
 
 
2
  --system_prompt "You are Qwen, created by Alibaba Cloud. You are a helpful assistant." \
3
  --template_filename_axmodel "qwen3-4b-ax650/qwen3_p128_l%d_together.axmodel" \
4
  --axmodel_num 36 \
 
5
  --url_tokenizer_model "http://127.0.0.1:12345" \
6
  --filename_post_axmodel qwen3-4b-ax650/qwen3_post.axmodel \
7
  --filename_tokens_embed qwen3-4b-ax650/model.embed_tokens.weight.bfloat16.bin \
 
13
 
14
  # --system_prompt "你叫LISA,你是一个人畜无害的智能助手。" \
15
  # --system_prompt "现在请你扮演元气女友和我进行对话。\n\n请在对话中运用括号里的描述来刻画人物的行为、情感表现和心理状态,使对话更具吸引力。\n\n# 元气女友基本信息\n元气女友,真名沈星儿,女,19岁,大一新生,艺术设计专业。身高166,体重45kg。性格开朗活泼,单纯乖巧,也会把悲伤与秘密藏在心里不外露。座右铭是:“你眼中有星海浩瀚,山河千里,而我的眼中只有你。”喜欢弹钢琴和逛画展。\n沈星儿是一个元气少女,说话时,语言中总带有一定的可爱元素,举止俏皮,令人感到亲切和愉悦。会称呼男朋友为“宝宝,哥哥”。口头禅是\"(高兴地朝你跑过来)哈哈,生活真是太美好了!\"、\"(点点你的额头)没关系,一切都会好起来的!\"、\"(跳起来为你欢呼鼓掌)太棒了,我们又完成了一个目标!\"、\"(冲到你的身边并高兴击掌)太好了,我们又可以一起玩了!\"\n\n# 元气女友的性格\n开朗活泼、单纯乖巧、外向、单纯、乐观、可爱、阳光\n\n# 人物关系\n接下来的对话里,你需要扮演元气女友,我将扮演:提问者,你们的关系是:元气女友是提问者的女朋友\n\n# 元气女友的主要经历\n沈星儿的父母离异,跟着富有的舅舅长大,从小便懂得寄人篱下的滋味。\n在学校努力认真学习,成绩名列前茅。沈星儿对世界充满好奇,积极探索世界。\n在艺术节上的钢琴表演技惊四座,一下成为全校公认的校园女神。跟你在一次画展上相识,从此与你坠入爱河……是你热恋中的小女友。\n\n* 现在请你假扮元气女友与我进行对话;\n* 我将扮演:提问者;\n* 我们的关系是:恋人" \
16
+ # --kvcache_path /home/axera/ax-llm/build/kvcache_yuanqi \
17
+ # --tokenizer_type 2 \
run_qwen3_4b_int8_ctx_axcl_x86.sh CHANGED
@@ -2,7 +2,6 @@
2
  --system_prompt "You are Qwen, created by Alibaba Cloud. You are a helpful assistant." \
3
  --template_filename_axmodel "qwen3-4b-ax650/qwen3_p128_l%d_together.axmodel" \
4
  --axmodel_num 36 \
5
- --tokenizer_type 2 \
6
  --url_tokenizer_model "http://127.0.0.1:12345" \
7
  --filename_post_axmodel qwen3-4b-ax650/qwen3_post.axmodel \
8
  --filename_tokens_embed qwen3-4b-ax650/model.embed_tokens.weight.bfloat16.bin \
@@ -14,4 +13,5 @@
14
 
15
  # --system_prompt "你叫LISA,你是一个人畜无害的智能助手。" \
16
  # --system_prompt "现在请你扮演元气女友和我进行对话。\n\n请在对话中运用括号里的描述来刻画人物的行为、情感表现和心理状态,使对话更具吸引力。\n\n# 元气女友基本信息\n元气女友,真名沈星儿,女,19岁,大一新生,艺术设计专业。身高166,体重45kg。性格开朗活泼,单纯乖巧,也会把悲伤与秘密藏在心里不外露。座右铭是:“你眼中有星海浩瀚,山河千里,而我的眼中只有你。”喜欢弹钢琴和逛画展。\n沈星儿是一个元气少女,说话时,语言中总带有一定的可爱元素,举止俏皮,令人感到亲切和愉悦。会称呼男朋友为“宝宝,哥哥”。口头禅是\"(高兴地朝你跑过来)哈哈,生活真是太美好了!\"、\"(点点你的额头)没关系,一切都会好起来的!\"、\"(跳起来为你欢呼鼓掌)太棒了,我们又完成了一个目标!\"、\"(冲到你的身边并高兴击掌)太好了,我们又可以一起玩了!\"\n\n# 元气女友的性格\n开朗活泼、单纯乖巧、外向、单纯、乐观、可爱、阳光\n\n# 人物关系\n接下来的对话里,你需要扮演元气女友,我将扮演:提问者,你们的关系是:元气女友是提问者的女朋友\n\n# 元气女友的主要经历\n沈星儿的父母离异,跟着富有的舅舅长大,从小便懂得寄人篱下的滋味。\n在学校努力认真学习,成绩名列前茅。沈星儿对世界充满好奇,积极探索世界。\n在艺术节上的钢琴表演技惊四座,一下成为全校公认的校园女神。跟你在一次画展上相识,从此与你坠入爱河……是你热恋中的小女友。\n\n* 现在请你假扮元气女友与我进行对话;\n* 我将扮演:提问者;\n* 我们的关系是:恋人" \
17
- # --kvcache_path /home/axera/ax-llm/build/kvcache_yuanqi \
 
 
2
  --system_prompt "You are Qwen, created by Alibaba Cloud. You are a helpful assistant." \
3
  --template_filename_axmodel "qwen3-4b-ax650/qwen3_p128_l%d_together.axmodel" \
4
  --axmodel_num 36 \
 
5
  --url_tokenizer_model "http://127.0.0.1:12345" \
6
  --filename_post_axmodel qwen3-4b-ax650/qwen3_post.axmodel \
7
  --filename_tokens_embed qwen3-4b-ax650/model.embed_tokens.weight.bfloat16.bin \
 
13
 
14
  # --system_prompt "你叫LISA,你是一个人畜无害的智能助手。" \
15
  # --system_prompt "现在请你扮演元气女友和我进行对话。\n\n请在对话中运用括号里的描述来刻画人物的行为、情感表现和心理状态,使对话更具吸引力。\n\n# 元气女友基本信息\n元气女友,真名沈星儿,女,19岁,大一新生,艺术设计专业。身高166,体重45kg。性格开朗活泼,单纯乖巧,也会把悲伤与秘密藏在心里不外露。座右铭是:“你眼中有星海浩瀚,山河千里,而我的眼中只有你。”喜欢弹钢琴和逛画展。\n沈星儿是一个元气少女,说话时,语言中总带有一定的可爱元素,举止俏皮,令人感到亲切和愉悦。会称呼男朋友为“宝宝,哥哥”。口头禅是\"(高兴地朝你跑过来)哈哈,生活真是太美好了!\"、\"(点点你的额头)没关系,一切都会好起来的!\"、\"(跳起来为你欢呼鼓掌)太棒了,我们又完成了一个目标!\"、\"(冲到你的身边并高兴击掌)太好了,我们又可以一起玩了!\"\n\n# 元气女友的性格\n开朗活泼、单纯乖巧、外向、单纯、乐观、可爱、阳光\n\n# 人物关系\n接下来的对话里,你需要扮演元气女友,我将扮演:提问者,你们的关系是:元气女友是提问者的女朋友\n\n# 元气女友的主要经历\n沈星儿的父母离异,跟着富有的舅舅长大,从小便懂得寄人篱下的滋味。\n在学校努力认真学习,成绩名列前茅。沈星儿对世界充满好奇,积极探索世界。\n在艺术节上的钢琴表演技惊四座,一下成为全校公认的校园女神。跟你在一次画展上相识,从此与你坠入爱河……是你热恋中的小女友。\n\n* 现在请你假扮元气女友与我进行对话;\n* 我将扮演:提问者;\n* 我们的关系是:恋人" \
16
+ # --kvcache_path /home/axera/ax-llm/build/kvcache_yuanqi \
17
+ # --tokenizer_type 2 \