Upload optimized ONNX models w/ GQA

#10
by Xenova HF Staff - opened
onnx/model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f40876b94cd0de51afcfe1e7d8080c279c7072137b7eb0abbab1c8ff5ba2e9f
3
- size 1638275586
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf419c37a4f6073a325028245d4cae2e6135765f0f2841dbe6f48c8cd261bbcd
3
+ size 1449582810
onnx/model_bnb4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53bb7e8dd5184642c8ffe8776b98070da31678ec886c0b8eaea82fc0e3342325
3
+ size 368284174
onnx/model_fp16.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d29891daee174979d9988b78b3fe1c539a0c9b425734099ac46a30c4c613dfce
3
- size 819212911
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b3bbb7e1435a9c52f4435b21dc77dc40b71a988ab2f0b4ce47b04b52ca9e8e8
3
+ size 724891911
onnx/model_int8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb7375a212a6583cbd96eaa739142f3a1a0d17cbd51043c60f081ea5ce6d21e3
3
+ size 364564558
onnx/model_q4.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4525a8138b8474d5a1ab005b1a3703317c6f13257f3ce69aa711c6c74eb786a3
3
- size 417375737
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4ffda96e65beafc6f6cef0cbcf9fdc1cbdd79c230906bf3897d190547c7a596
3
+ size 387943246
onnx/model_q4f16.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:99bce272c14df5583be4299c4af4c9b9d52500b16a0e6e79f1beec948edb3fc4
3
- size 299220646
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc63370efc2aca6d5307518b85162777132cc5b8d68eeb8154ea9b5fce09ad46
3
+ size 272737275
onnx/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57987a3a24dc34ad2cb5e7e566840ccaece095e35a24ae4fc5b3086c7ddd6918
3
+ size 364564671
onnx/model_uint8.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57987a3a24dc34ad2cb5e7e566840ccaece095e35a24ae4fc5b3086c7ddd6918
3
+ size 364564671