| from mmengine.config import read_base |
|
|
| from opencompass.models import TurboMindModel |
|
|
| with read_base(): |
| from opencompass.configs.datasets.longbench.longbench import \ |
| longbench_datasets |
| from opencompass.configs.datasets.needlebench.needlebench_base.needlebench_base_gen import \ |
| needlebench_datasets |
| |
| from opencompass.configs.summarizers.groups.longbench import \ |
| longbench_summary_groups |
| from opencompass.configs.summarizers.needlebench import \ |
| needlebench_internal_200k_summarizer |
| from opencompass.configs.summarizers.needlebench import ( |
| needlebench_internal_32k_summarizer, |
| needlebench_internal_100k_summarizer) |
|
|
| from ...rjob import eval, infer |
|
|
# Expose the `summary_groups` entry of each imported needlebench summarizer
# config (32k, 100k and 200k variants) under its own module-level name.
needlebench_internal_32k_summary_groups = (
    needlebench_internal_32k_summarizer['summary_groups'])
needlebench_internal_100k_summary_groups = (
    needlebench_internal_100k_summarizer['summary_groups'])
needlebench_internal_200k_summary_groups = (
    needlebench_internal_200k_summarizer['summary_groups'])
|
|
# Model list for this run: a single Qwen3-8B-Base entry that uses the
# `TurboMindModel` wrapper.
models = [
    {
        'type': TurboMindModel,
        'abbr': 'qwen3-8b-base-turbomind',
        'path': 'Qwen/Qwen3-8B-Base',
        # `session_len` is set to the same value as `max_seq_len` below.
        'engine_config': {
            'session_len': 264192,
            'max_batch_size': 8,
            'tp': 1,
        },
        # top_k=1 with a near-zero temperature -- presumably meant to make
        # decoding effectively deterministic; confirm against the backend.
        'gen_config': {
            'top_k': 1,
            'temperature': 1e-6,
            'top_p': 0.9,
            'max_new_tokens': 2048,
            'min_out_len': 2,
        },
        'max_seq_len': 264192,
        # NOTE(review): differs from gen_config['max_new_tokens'] (2048);
        # which of the two limits takes effect is not visible in this file.
        'max_out_len': 500,
        'batch_size': 1,
        'drop_middle': True,
        'run_cfg': {'num_gpus': 1},
    },
]
|
|
# Take the first element of every non-empty list that is bound, in this
# namespace, to a name ending in `_datasets`. `locals()` is evaluated once,
# before the comprehension starts iterating, so `datasets` itself is not yet
# among the candidates. A comprehension is used so that the helper names do
# not stay bound at module level afterwards.
datasets = [
    candidates[0]
    for var_name, candidates in locals().items()
    if var_name.endswith('_datasets')
    and isinstance(candidates, list)
    and candidates
]
|
|
# Set the reader's `test_range` to '[0:16]' on every selected dataset config.
# The entries are modified in place. The loop variable keeps the name `d`
# because it remains bound at module level once the loop has finished.
for d in datasets:
    d['reader_cfg'].update(test_range='[0:16]')
|
|