iOS GPU best: int4-kmeans fused-kernel core (17.7 tok/s)
Browse files
.gitattributes
CHANGED
|
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
ios-gpu/gemma4_e2b_metal_int4km_L35.aimodel/main.mlirb filter=lfs diff=lfs merge=lfs -text
|
ios-gpu/gemma4_e2b_metal_int4km_L35.aimodel/main.hash
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
_����k�M
|
| 2 |
+
�-J�xWޡl6��z�vN
|
ios-gpu/gemma4_e2b_metal_int4km_L35.aimodel/main.mlirb
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5fcb12a1e594efa86bb74d0ade2d4a139c7857dea16c361e99fc7ab3764e0f10
|
| 3 |
+
size 1392365289
|
ios-gpu/gemma4_e2b_metal_int4km_L35.aimodel/metadata.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"assetVersion" : "2.0"
|
| 3 |
+
}
|