caiovicentino1's picture
Add hlwq_config.json (rename from polar_config.json)
9884878 verified
raw
history blame contribute delete
658 Bytes
{
"method": "HLWQ",
"weight_bits": 5,
"kv_cache_bits": 3,
"block_size": 128,
"head_dim": 128,
"num_layers": 64,
"quantized_layers": 497,
"skipped_layers": 0,
"int4_group_size": 128,
"vram_gb": 19.1,
"base_model": "huihui-ai/Huihui-Qwopus3.5-27B-v3-abliterated",
"benchmark": {
"FP16": {
"tok_s": 21.804779849809538,
"peak_gb": 70.363202048,
"time": 4.586150407791138
},
"Q3": {
"tok_s": 22.092763850247692,
"peak_gb": 19.130801664,
"time": 4.526368935902913
},
"Q2": {
"tok_s": 22.038845106697618,
"peak_gb": 19.130801664,
"time": 4.537442843119304
}
}
}