Qwen3-0.6B-SplitQuant-w8a8g128 / compressed_config.json
Xinxiong0912's picture
Upload folder using huggingface_hub
7d8523d verified
{
"format": "mindpipe_hf_save_pretrained_debug",
"algorithm": "splitquant",
"model_path": "/mnt/42_store/wxx/modelzoo/Qwen/Qwen3-0.6B",
"result_dir": "/mnt/82_store/wxx/HWQuant/Mindpipe/results/Qwen3-0.6B/splitquant/splitquant_w8a8_q16k16v16_seq512",
"weight_bits": 8,
"activation_bits": 8,
"sequence_length": 512,
"group_size": 128,
"output_dir": "/mnt/82_store/wxx/HWQuant/Mindpipe/tmp_hf_save/Qwen3-0.6B-SplitQuant-w8a8g128/_pre_save_workflow",
"pre_save_metrics": {
"perplexity": 28.215095258159398,
"evaluation_dataset": "wikitext2",
"sequence_length": 512,
"evaluated_chunks": 4,
"batch_size": 1,
"elapsed_seconds": 1.5785746639594436,
"tokens_per_second": 1294.8389750999538,
"model_path": "/mnt/42_store/wxx/modelzoo/Qwen/Qwen3-0.6B",
"quantization_algorithm": "splitquant",
"weight_bits": 8,
"activation_bits": 8,
"device": "cuda:0",
"dtype": "float16",
"artifacts_path": "artifacts.json"
},
"load_note": "Use MindPipe to rebuild the compression structure before loading the HF state dict."
}