-
Notifications
You must be signed in to change notification settings - Fork 407
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
[Sync] Sync with internal codes 2024.06.28 (#1279)
- Loading branch information
Showing
284 changed files
with
6,238 additions
and
1,295 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,57 @@ | ||
import os | ||
|
||
from opencompass.openicl.icl_prompt_template import PromptTemplate | ||
from opencompass.openicl.icl_retriever import ZeroRetriever | ||
from opencompass.openicl.icl_inferencer import PPLInferencer | ||
from opencompass.datasets import CharmDataset | ||
from opencompass.openicl.icl_evaluator import AccwithDetailsEvaluator | ||
|
||
# Each entry pairs a CHARM reasoning task name with the string of option
# letters that are valid answers for that task.
charm_tasks = [
    ['Chinese_Anachronisms_Judgment', 'AB'],
    ['Chinese_Movie_and_Music_Recommendation', 'ABCD'],
    ['Chinese_Natural_Language_Inference', 'ABC'],
    ['Chinese_Reading_Comprehension', 'ABCD'],
    ['Chinese_Sequence_Understanding', 'ABCD'],
    ['Chinese_Sport_Understanding', 'AB'],
    ['Chinese_Time_Understanding', 'ABCD'],
    ['Global_Anachronisms_Judgment', 'AB'],
    ['Global_Movie_and_Music_Recommendation', 'ABCD'],
    ['Global_Natural_Language_Inference', 'ABC'],
    ['Global_Reading_Comprehension', 'ABCD'],
    ['Global_Sequence_Understanding', 'ABCD'],
    ['Global_Sport_Understanding', 'AB'],
    ['Global_Time_Understanding', 'ABCDEF'],
]

# One dataset config is appended per task in `charm_tasks`.
charm_reason_datasets = []
for task_name, options in charm_tasks:

    # The few-shot prompt lives next to this config file under
    # 'few-shot-examples/<task_name>_Direct.txt'. Read it as UTF-8 explicitly
    # so the result does not depend on the platform's default locale encoding
    # (the prompts presumably contain non-ASCII text -- verify against the
    # data files).
    with open(
        os.path.join(os.path.dirname(__file__), 'few-shot-examples', f'{task_name}_Direct.txt'),
        'r',
        encoding='utf-8',
    ) as f:
        few_shot_example = f.read()

    charm_reason_reader_cfg = dict(input_columns=['input'], output_column='target')

    charm_reason_infer_cfg = dict(
        prompt_template=dict(
            type=PromptTemplate,
            # One template per candidate option, keyed '(A)', '(B)', ...; each
            # is the few-shot text, the '{input}' placeholder and that option
            # letter as the answer.
            template={
                f'({opt})': f'{few_shot_example}\n{{input}}\nA: {opt}' for opt in options
            },
        ),
        retriever=dict(type=ZeroRetriever),
        inferencer=dict(type=PPLInferencer),
    )

    charm_reason_eval_cfg = dict(evaluator=dict(type=AccwithDetailsEvaluator))

    charm_reason_datasets.append(
        dict(
            type=CharmDataset,
            abbr=f'charm-reason-{task_name}_Direct',
            path='data/CHARM/reasoning',
            name=task_name,
            reader_cfg=charm_reason_reader_cfg,
            infer_cfg=charm_reason_infer_cfg,
            eval_cfg=charm_reason_eval_cfg,
        )
    )
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
57 changes: 57 additions & 0 deletions
57
configs/datasets/compassbench_20_v1_1/agent/cibench_template_gen_e6b12a.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,57 @@ | ||
from opencompass.openicl.icl_prompt_template import PromptTemplate | ||
from opencompass.openicl.icl_retriever import ZeroRetriever | ||
from opencompass.openicl.icl_inferencer import AgentInferencer | ||
from opencompass.datasets import CIBenchDataset, CIBenchEvaluator | ||
|
||
# Path suffixes appended to 'cibench_template': every library once with a
# plain '/' prefix and once with a '_chinese/' prefix, in that order.
libs = [
    f'{variant}/{library}'
    for variant in ('', '_chinese')
    for library in (
        'lightgbm',
        'matplotlib',
        'nltk',
        'opencv',
        'pandas',
        'pytorch',
        'scipy',
        'seaborn',
        'sklearn',
        'tensorflow',
    )
]

# One dataset config per suffix; the reader/infer/eval configs are rebuilt
# on every iteration so that each dataset entry owns its own dict objects.
cibench_datasets = []
for lib in libs:
    cibench_reader_cfg = {
        'input_columns': ['questions'],
        'output_column': 'references',
        'train_split': 'test',
        'test_split': 'test',
    }

    cibench_infer_cfg = {
        'prompt_template': {
            'type': PromptTemplate,
            'template': '{questions}',
        },
        'retriever': {'type': ZeroRetriever},
        'inferencer': {'type': AgentInferencer, 'infer_mode': 'every'},
    }

    cibench_eval_cfg = {
        'evaluator': {'type': CIBenchEvaluator},
        'pred_role': 'BOT',
    }

    cibench_datasets.append({
        'abbr': f'cibench_template{lib}',
        'type': CIBenchDataset,
        'path': f'data/compassbench_v1.1/agent-cibench/cibench_template{lib}',
        'internet_check': False,
        'reader_cfg': cibench_reader_cfg,
        'infer_cfg': cibench_infer_cfg,
        'eval_cfg': cibench_eval_cfg,
    })
56 changes: 56 additions & 0 deletions
56
configs/datasets/compassbench_20_v1_1/agent/mus_teval_gen_105c48.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,56 @@ | ||
from opencompass.openicl.icl_prompt_template import PromptTemplate | ||
from opencompass.openicl.icl_retriever import ZeroRetriever | ||
from opencompass.openicl.icl_inferencer import ChatInferencer | ||
from opencompass.openicl.icl_evaluator import TEvalEvaluator | ||
from opencompass.datasets import teval_postprocess, TEvalDataset | ||
|
||
# Maps each evaluator subset name to the dataset split names evaluated
# under it.
plugin_eval_subject_mapping = {
    'instruct': ['instruct_v1'],
    'instruct_zh': ['instruct_v1_zh'],
    'plan': ['plan_json_v1', 'plan_str_v1'],
    'plan_zh': ['plan_json_v1_zh', 'plan_str_v1_zh'],
    'review': ['review_str_v1'],
    'review_zh': ['review_str_v1_zh'],
    'reason_retrieve_understand': ['reason_retrieve_understand_json_v1'],
    'reason_retrieve_understand_zh': ['reason_retrieve_understand_json_v1_zh'],
    'reason': ['reason_str_v1'],
    'reason_zh': ['reason_str_v1_zh'],
    'retrieve': ['retrieve_str_v1'],
    'retrieve_zh': ['retrieve_str_v1_zh'],
    'understand': ['understand_str_v1'],
    'understand_zh': ['understand_str_v1_zh'],
}

# Build one dataset config per split name. The reader/infer/eval configs are
# created once per mapping key and shared by all splits listed under it.
plugin_eval_datasets = []
for _name in plugin_eval_subject_mapping:
    plugin_eval_reader_cfg = {
        'input_columns': ['prompt'],
        'output_column': 'ground_truth',
    }
    plugin_eval_infer_cfg = {
        'prompt_template': {
            'type': PromptTemplate,
            'template': {
                'round': [
                    {'role': 'HUMAN', 'prompt': '{prompt}'},
                ],
            },
        },
        'retriever': {'type': ZeroRetriever},
        'inferencer': {'type': ChatInferencer},
    }
    plugin_eval_eval_cfg = {
        # The evaluator is told which subset (the mapping key) it scores.
        'evaluator': {'type': TEvalEvaluator, 'subset': _name},
        'pred_postprocessor': {'type': teval_postprocess},
        'num_gpus': 1,
    }

    for subset in plugin_eval_subject_mapping[_name]:
        plugin_eval_datasets.append({
            'abbr': f'plugin_eval-mus-p10-{subset}',
            'type': TEvalDataset,
            'path': 'data/compassbench_v1.1/agent-teval-p10',
            'name': subset,
            'reader_cfg': plugin_eval_reader_cfg,
            'infer_cfg': plugin_eval_infer_cfg,
            'eval_cfg': plugin_eval_eval_cfg,
        })
Oops, something went wrong.