iOS ANE best: dynamic int8 (14.7 tok/s)
Browse files
.gitattributes
CHANGED
|
@@ -36,3 +36,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 36 |
dynamic-int8/qwen3_5_0_8b_decode_int8.aimodel/main.mlirb filter=lfs diff=lfs merge=lfs -text
|
| 37 |
ios-gpu-static/qwen3_5_0_8b_ios_hc0.aimodel/main.mlirb filter=lfs diff=lfs merge=lfs -text
|
| 38 |
ios-gpu/qwen3_5_0_8b_ios_hc0.aimodel/main.mlirb filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 36 |
dynamic-int8/qwen3_5_0_8b_decode_int8.aimodel/main.mlirb filter=lfs diff=lfs merge=lfs -text
|
| 37 |
ios-gpu-static/qwen3_5_0_8b_ios_hc0.aimodel/main.mlirb filter=lfs diff=lfs merge=lfs -text
|
| 38 |
ios-gpu/qwen3_5_0_8b_ios_hc0.aimodel/main.mlirb filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
ios-ane/qwen3_5_0_8b_decode_int8.aimodel/main.mlirb filter=lfs diff=lfs merge=lfs -text
|
ios-ane/qwen3_5_0_8b_decode_int8.aimodel/main.hash
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
h�����[�B��L�g����r8���gL
|
ios-ane/qwen3_5_0_8b_decode_int8.aimodel/main.mlirb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6802af95ef17b5f85bba42de1b8f4ca467aef6e4de1d72173883b0ae16674c1f
|
| 3 |
+
size 1016041748
|
ios-ane/qwen3_5_0_8b_decode_int8.aimodel/metadata.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"assetVersion" : "2.0"
|
| 3 |
+
}
|