rolf-mozilla committed on
Commit
1c40fd6
·
unverified ·
1 Parent(s): 907f5cd

fixed quantize bug

Browse files
.gitattributes CHANGED
@@ -33,3 +33,13 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ onnx filter=lfs diff=lfs merge=lfs -text
37
+ onnx/decoder_model_merged_quantized.onnx filter=lfs diff=lfs merge=lfs -text
38
+ onnx/decoder_model_quantized.onnx filter=lfs diff=lfs merge=lfs -text
39
+ onnx/decoder_with_past_model.onnx filter=lfs diff=lfs merge=lfs -text
40
+ onnx/decoder_with_past_model_quantized.onnx filter=lfs diff=lfs merge=lfs -text
41
+ onnx/encoder_model.onnx filter=lfs diff=lfs merge=lfs -text
42
+ onnx/encoder_model_quantized.onnx filter=lfs diff=lfs merge=lfs -text
43
+ onnx/decoder_model.onnx filter=lfs diff=lfs merge=lfs -text
44
+ onnx/decoder_model_merged.onnx filter=lfs diff=lfs merge=lfs -text
45
+ spiece.model filter=lfs diff=lfs merge=lfs -text
generation_config.json CHANGED
@@ -3,5 +3,5 @@
3
  "decoder_start_token_id": 0,
4
  "eos_token_id": 1,
5
  "pad_token_id": 0,
6
- "transformers_version": "4.33.2"
7
  }
 
3
  "decoder_start_token_id": 0,
4
  "eos_token_id": 1,
5
  "pad_token_id": 0,
6
+ "transformers_version": "4.43.4"
7
  }
onnx/decoder_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6cd6a58ed61e3ad6b6648564b5c87f3422414f116a16064ee5da03ec2a73a8ef
3
- size 166761386
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47fecb931e99812451230bfbcd05df81c330e92853fed4f223141ac18998d0f6
3
+ size 232559765
onnx/decoder_model_merged.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b52d2aad9a394b4cae07a91300e9bcb631963d6104101c3a53b0180b7d5fdb6
3
- size 167000290
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7df44b9b954011517a74d593f49f5fac757aa903534951e8df4237150427c178
3
+ size 232798796
onnx/decoder_model_merged_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:962a974755eef4e1192591d91922e06624f7285e9a8a4c4a2a33a8ecbaa7c775
3
- size 42585712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e72338ec1b43134186d26db751876ec97719f60f3601451566bcef81780a48c
3
+ size 59198001
onnx/decoder_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:071c28acd17136d14facf28f55ef854083848ef5dcf8c2bce70a1a63fb562121
3
- size 42257376
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ccc23acc49ac46b4ba29b02469b46807b25b9f4ef6ddb3f26c2cc7d083250cc
3
+ size 58868682
onnx/decoder_with_past_model.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:229cb63818c01c2a91a5db80136cfe7c693e1cda131ce84d5b6b69918b9ed9cc
3
- size 154132337
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:277fa93744c2c1da786980159a13b768c1c92f21625b8954eaa68cabac468b13
3
+ size 219930925
onnx/decoder_with_past_model_quantized.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6060047a733908eb820cfad6896124d648682add77b93904dc18c4907d65ae98
3
- size 39019088
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:600b50b5c2ccdd7e70a6d6386ab69d820a295e12a58f51ad9f62b149a5667372
3
+ size 55630603