MetaphoricalCode committed on
Commit
a9ebbbd
·
verified ·
1 Parent(s): 9f54338

Proper bos_token_id

Browse files
Files changed (2) hide show
  1. README.md +2 -0
  2. config.json +4 -4
README.md CHANGED
@@ -8,6 +8,8 @@ tags:
8
  - mergekitty
9
  - merge
10
  ---
 
 
11
  ## Quantized using the default exllamav3 (0.0.2) quantization process.
12
 
13
  - Original model: https://huggingface.co/trashpanda-org/QwQ-32B-Snowdrop-v0
 
8
  - mergekitty
9
  - merge
10
  ---
11
+ # UPDATE: 07.06.2025
12
+ - Proper eos_token_id was uploaded. Download the new config.json file for the model to work properly!
13
  ## Quantized using the default exllamav3 (0.0.2) quantization process.
14
 
15
  - Original model: https://huggingface.co/trashpanda-org/QwQ-32B-Snowdrop-v0
config.json CHANGED
@@ -5,7 +5,7 @@
5
  ],
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 151643,
8
- "eos_token_id": 151643,
9
  "hidden_act": "silu",
10
  "hidden_size": 5120,
11
  "initializer_range": 0.02,
@@ -28,9 +28,9 @@
28
  "vocab_size": 151665,
29
  "quantization_config": {
30
  "quant_method": "exl3",
31
- "version": "0.0.2",
32
- "bits": 4.5,
33
- "head_bits": 8,
34
  "calibration": {
35
  "rows": 100,
36
  "cols": 2048
 
5
  ],
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 151643,
8
+ "eos_token_id": 151645,
9
  "hidden_act": "silu",
10
  "hidden_size": 5120,
11
  "initializer_range": 0.02,
 
28
  "vocab_size": 151665,
29
  "quantization_config": {
30
  "quant_method": "exl3",
31
+ "version": "0.0.1",
32
+ "bits": 4.0,
33
+ "head_bits": 6,
34
  "calibration": {
35
  "rows": 100,
36
  "cols": 2048