Update config.json with the correct state
Browse files
The model is compressed; however, it was incorrectly saved with the "frozen" quantization_status, which results in incorrect loading through transformers.
- config.json +1 -1
config.json
CHANGED
|
@@ -75,6 +75,6 @@
|
|
| 75 |
],
|
| 76 |
"kv_cache_scheme": null,
|
| 77 |
"quant_method": "compressed-tensors",
|
| 78 |
-
"quantization_status": "frozen"
|
| 79 |
}
|
| 80 |
}
|
|
|
|
| 75 |
],
|
| 76 |
"kv_cache_scheme": null,
|
| 77 |
"quant_method": "compressed-tensors",
|
| 78 |
+
"quantization_status": "compressed"
|
| 79 |
}
|
| 80 |
}
|