decodeshare / artifacts /rebuttal /pca_prefill_decode_mismatch_layer28.json
Zishan Shao
Add lighthouse rebuttal artifacts
1c8e365
{
"config": {
"model": "meta-llama/Llama-2-7b-chat-hf",
"device": "cuda",
"model_dtype": "fp32",
"layers": "28",
"filter_regex": "",
"tasks_subspace": "gsm8k,commonsenseqa,strategyqa,aqua,arc_challenge,openbookqa,qasc,logiqa",
"n_subspace": 128,
"template_seed": 1234,
"template_randomization": 1,
"shuffle_choices": 1,
"answer_prefix": "\nFinal answer:",
"add_answer_prefix": 1,
"calib_decode_max_new_tokens": 128,
"decoding": "greedy",
"temperature": 0.7,
"top_p": 0.9,
"top_k": 0,
"ks": "32,64,128,256",
"pca_max_rows": 200000,
"per_task_max_states": 20000,
"pca_max_dim": 4096,
"batch_size": 4,
"max_prompt_len": 512,
"seed": 42,
"out_json": "rebuttal/pca_prefill_decode_mismatch_layer28.json"
},
"layers": [
28
],
"tasks_used": [
"gsm8k",
"commonsenseqa",
"strategyqa",
"aqua",
"arc_challenge",
"openbookqa",
"qasc",
"logiqa"
],
"by_layer": {
"28": {
"n_rows_prefill": 1024,
"n_rows_decode": 125624,
"d": 4096,
"k_max": 256,
"angles_deg": {
"32": {
"mean": 80.07994079589844,
"p50": 83.09337615966797,
"p95": 89.45713806152344,
"min": 38.77346420288086,
"max": 89.99810791015625
},
"64": {
"mean": 79.11544036865234,
"p50": 81.45398712158203,
"p95": 89.08732604980469,
"min": 32.79534149169922,
"max": 89.96986389160156
},
"128": {
"mean": 77.17108154296875,
"p50": 79.1217041015625,
"p95": 88.75955200195312,
"min": 27.36577033996582,
"max": 89.98320770263672
},
"256": {
"mean": 74.06597900390625,
"p50": 75.53594970703125,
"p95": 88.58094787597656,
"min": 21.949682235717773,
"max": 89.8911361694336
}
},
"cos_singulars": {
"32": {
"mean": 0.1674889326095581,
"min": 3.307082806713879e-05,
"max": 0.7796280384063721
},
"64": {
"mean": 0.18428365886211395,
"min": 0.000525902840308845,
"max": 0.8406106233596802
},
"128": {
"mean": 0.21747536957263947,
"min": 0.0002930520277004689,
"max": 0.8880901336669922
},
"256": {
"mean": 0.26861822605133057,
"min": 0.0018999958410859108,
"max": 0.9275124669075012
}
},
"explained_var_ratio": {
"32": {
"decode_by_decode": 0.2242752910874054,
"decode_by_prefill": 0.040454826437110264,
"prefill_by_prefill": 0.7956135344728951,
"prefill_by_decode": 0.0723876062212326
},
"64": {
"decode_by_decode": 0.287591268318897,
"decode_by_prefill": 0.05677867750419193,
"prefill_by_prefill": 0.8528749960118728,
"prefill_by_decode": 0.10226643959551017
},
"128": {
"decode_by_decode": 0.3630458220461663,
"decode_by_prefill": 0.08018399896361926,
"prefill_by_prefill": 0.9034699791539794,
"prefill_by_decode": 0.14957190001338527
},
"256": {
"decode_by_decode": 0.44764296315041163,
"decode_by_prefill": 0.11975813122324773,
"prefill_by_prefill": 0.9455660636505742,
"prefill_by_decode": 0.21092156502465595
}
}
}
}
}