File size: 1,039 Bytes
{
"format": "mindpipe_hf_save_pretrained_debug",
"algorithm": "awq",
"model_path": "/mnt/82_store/LLM-weights/openbmb/MiniCPM-V",
"result_dir": "/mnt/82_store/wxx/HWQuant/Mindpipe/results/MiniCPM-V/awq/awq_w4a16_seq512",
"weight_bits": 4,
"activation_bits": 16,
"sequence_length": 512,
"group_size": 128,
"output_dir": "/mnt/82_store/wxx/HWQuant/Mindpipe/tmp_hf_save/MiniCPM-V-AWQ-w4a16g128/_pre_save_workflow",
"pre_save_metrics": {
"perplexity": 9.501230692469067,
"evaluation_dataset": "wikitext2",
"sequence_length": 512,
"evaluated_chunks": 4,
"batch_size": 1,
"elapsed_seconds": 0.47178575303405523,
"tokens_per_second": 4332.475041594689,
"model_path": "/mnt/82_store/LLM-weights/openbmb/MiniCPM-V",
"quantization_algorithm": "awq",
"weight_bits": 4,
"activation_bits": 16,
"device": "cuda:0",
"dtype": "float16",
"artifacts_path": "artifacts.json"
},
"load_note": "Use MindPipe to rebuild the compression structure before loading the HF state dict."
}