chidamnat2002 committed on
Commit
0197d90
·
verified ·
1 Parent(s): 6a43eb9

Upload 10 files

Browse files

quantization of models

config.json CHANGED
@@ -1,5 +1,6 @@
1
  {
2
- "_name_or_path": "microsoft/MiniLM-L12-H384-uncased",
 
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
@@ -63,7 +64,7 @@
63
  "position_embedding_type": "absolute",
64
  "problem_type": "multi_label_classification",
65
  "torch_dtype": "float32",
66
- "transformers_version": "4.44.2",
67
  "type_vocab_size": 2,
68
  "use_cache": true,
69
  "vocab_size": 30522
 
1
  {
2
+ "_attn_implementation_autoset": true,
3
+ "_name_or_path": "Mozilla/content-multilabel-iab-classifier",
4
  "architectures": [
5
  "BertForSequenceClassification"
6
  ],
 
64
  "position_embedding_type": "absolute",
65
  "problem_type": "multi_label_classification",
66
  "torch_dtype": "float32",
67
+ "transformers_version": "4.49.0",
68
  "type_vocab_size": 2,
69
  "use_cache": true,
70
  "vocab_size": 30522
onnx/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c3c076e3f4924ee497e0f7fb34f85857ba955e092d3254816eee0cac86feebd
3
+ size 133740267
onnx/model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6c79fc1ced771200eab9a96005a0d88dbfa491055265dd9ff892247f1b29e30
3
+ size 67021343
onnx/model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ae0f888d3e323d5180ca12bb7959cec55fe525a45623b5c5158155133a7b3d0
3
+ size 62087374
onnx/model_quantized.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc8c08f4544840e7e02a44af9c82d342528c6756b1cf3a95c94c9703fe275490
3
+ size 34125553
quantize_config.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "modes": [
3
+ "q4",
4
+ "q8",
5
+ "fp16"
6
+ ],
7
+ "per_channel": true,
8
+ "reduce_range": true,
9
+ "block_size": null,
10
+ "is_symmetric": true,
11
+ "accuracy_level": null,
12
+ "quant_type": 1,
13
+ "op_block_list": null
14
+ }
tokenizer_config.json CHANGED
@@ -45,6 +45,7 @@
45
  "cls_token": "[CLS]",
46
  "do_basic_tokenize": true,
47
  "do_lower_case": true,
 
48
  "mask_token": "[MASK]",
49
  "max_length": 256,
50
  "model_max_length": 1000000000000000019884624838656,
 
45
  "cls_token": "[CLS]",
46
  "do_basic_tokenize": true,
47
  "do_lower_case": true,
48
+ "extra_special_tokens": {},
49
  "mask_token": "[MASK]",
50
  "max_length": 256,
51
  "model_max_length": 1000000000000000019884624838656,