| from mmengine.config import read_base |
|
|
| from opencompass.models import (HuggingFacewithChatTemplate, |
| TurboMindModelwithChatTemplate, |
| VLLMwithChatTemplate) |
| from opencompass.utils.text_postprocessors import extract_non_reasoning_content |
|
|
| with read_base(): |
| |
| from opencompass.configs.datasets.gsm8k.gsm8k_gen import \ |
| gsm8k_datasets |
| from opencompass.configs.datasets.race.race_gen import \ |
| race_datasets |
|
|
| |
| from ...rjob import eval, infer |
|
|
| Qwen3_0_6B_FP8_hf = dict( |
| type=HuggingFacewithChatTemplate, |
| abbr='qwen3_0_6b_fp8-hf', |
| path='Qwen/Qwen3-0.6B-FP8', |
| max_out_len=16384, |
| batch_size=8, |
| run_cfg=dict(num_gpus=1), |
| pred_postprocessor=dict(type=extract_non_reasoning_content)) |
|
|
| Qwen3_0_6B_FP8_turbomind = dict( |
| type=TurboMindModelwithChatTemplate, |
| abbr='qwen3-0_6b-fp8-turbomind', |
| path='Qwen/Qwen3-0.6B-FP8', |
| engine_config=dict(session_len=32768, max_batch_size=1), |
| gen_config=dict(top_k=1, max_new_tokens=16384), |
| max_seq_len=32768, |
| max_out_len=16384, |
| batch_size=1, |
| run_cfg=dict(num_gpus=1), |
| pred_postprocessor=dict(type=extract_non_reasoning_content)) |
|
|
| Qwen3_0_6B_FP8_vllm = dict( |
| type=VLLMwithChatTemplate, |
| abbr='qwen3-0_6b-fp8-vllm', |
| path='Qwen/Qwen3-0.6B-FP8', |
| model_kwargs=dict(tensor_parallel_size=1), |
| generation_kwargs=dict(do_sample=False), |
| max_seq_len=32768, |
| max_out_len=16384, |
| batch_size=16, |
| run_cfg=dict(num_gpus=1), |
| ) |
|
|
| race_datasets = [race_datasets[1]] |
| datasets = sum([v for k, v in locals().items() if k.endswith('_datasets')], []) |
|
|
| for d in datasets: |
| d['reader_cfg']['test_range'] = '[0:32]' |
|
|
| models = sum([v for k, v in locals().items() if k.endswith('_model')], []) |
|
|
| models = [Qwen3_0_6B_FP8_hf, Qwen3_0_6B_FP8_turbomind, Qwen3_0_6B_FP8_vllm] |
|
|
| summarizer = dict( |
| dataset_abbrs=[ |
| 'gsm8k', |
| 'race-middle', |
| 'race-high', |
| ], |
| summary_groups=sum( |
| [v for k, v in locals().items() if k.endswith('_summary_groups')], []), |
| ) |
|
|