|
|
from mmengine.config import read_base |
|
|
|
|
|
from opencompass.models import TurboMindModel |
|
|
|
|
|
with read_base(): |
|
|
from opencompass.configs.datasets.longbench.longbench import \ |
|
|
longbench_datasets |
|
|
from opencompass.configs.datasets.needlebench.needlebench_base.needlebench_base_gen import \ |
|
|
needlebench_datasets |
|
|
|
|
|
from opencompass.configs.summarizers.groups.longbench import \ |
|
|
longbench_summary_groups |
|
|
from opencompass.configs.summarizers.needlebench import \ |
|
|
needlebench_internal_200k_summarizer |
|
|
from opencompass.configs.summarizers.needlebench import ( |
|
|
needlebench_internal_32k_summarizer, |
|
|
needlebench_internal_100k_summarizer) |
|
|
|
|
|
from ...rjob import eval, infer |
|
|
|
|
|
# Pull the 'summary_groups' entry out of each imported NeedleBench
# summarizer config so it is available as its own module-level name.
needlebench_internal_32k_summary_groups = (
    needlebench_internal_32k_summarizer['summary_groups']
)
needlebench_internal_100k_summary_groups = (
    needlebench_internal_100k_summarizer['summary_groups']
)
needlebench_internal_200k_summary_groups = (
    needlebench_internal_200k_summarizer['summary_groups']
)
|
|
|
|
|
# Models under evaluation: a single Qwen3-8B-Base entry served through
# TurboMindModel.
models = [
    dict(
        type=TurboMindModel,
        abbr='qwen3-8b-base-turbomind',
        path='Qwen/Qwen3-8B-Base',
        # session_len matches max_seq_len below (264192 = 258 * 1024).
        engine_config=dict(
            session_len=264192,
            max_batch_size=8,
            tp=1,
        ),
        # top_k=1 with a near-zero temperature: presumably intended to make
        # decoding effectively deterministic.
        # NOTE(review): max_new_tokens=2048 here differs from max_out_len=500
        # below, and min_out_len is passed inside gen_config -- confirm how
        # the backend resolves / accepts these keys.
        gen_config=dict(
            top_k=1,
            temperature=1e-6,
            top_p=0.9,
            max_new_tokens=2048,
            min_out_len=2,
        ),
        max_seq_len=264192,
        max_out_len=500,
        batch_size=1,
        drop_middle=True,
        run_cfg=dict(num_gpus=1),
    ),
]
|
|
|
|
|
# Dataset selection: keep only the first dataset config from every
# non-empty module-level list whose name ends with '_datasets'.
#
# The namespace is snapshotted with list(...) before filtering: iterating
# the live locals() mapping directly inside a comprehension can raise
# "RuntimeError: dictionary changed size during iteration" on Python 3.12+
# (inlined comprehensions, e.g. when running under tracing/coverage).
datasets = [
    v[0] for k, v in list(locals().items())
    if k.endswith('_datasets') and isinstance(v, list) and v
]

# Set each selected dataset's reader test_range to '[0:16]' (presumably
# limiting evaluation to the first 16 samples -- confirm against the
# dataset reader). The dicts are modified in place.
for d in datasets:
    d['reader_cfg']['test_range'] = '[0:16]'
|
|
|