mirror of
https://github.com/open-compass/opencompass.git
synced 2025-05-30 16:03:24 +08:00

Some checks failed
lint / lint (push) Has been cancelled
* 0-shot Smolinstruct Add 0-shot evaluation and postprocess functions for Smolinstruct * fix acc postprocessor * update 0-shot acc postprocessor * rename 0-shot
56 lines
2.7 KiB
Python
56 lines
2.7 KiB
Python
from opencompass.openicl.icl_prompt_template import PromptTemplate
|
|
from opencompass.openicl.icl_retriever import ZeroRetriever, FixKRetriever
|
|
from opencompass.openicl.icl_inferencer import GenInferencer
|
|
from opencompass.datasets.smolinstruct import FTSEvaluator
|
|
from opencompass.datasets import SmolInstructDataset
|
|
|
|
fts_0shot_reader_cfg = dict(
|
|
input_columns=['input'],
|
|
output_column='output',
|
|
train_split='validation')
|
|
|
|
fts_hint_dict = {
|
|
'MG': """You are an expert chemist. Given the description of a molecule, your task is to generate the potential SMILES representation of the molecule.
|
|
The input contains the description of the molecule. Your reply should contain the potential SMILES representation of the molecule wrapped in <SMILES> and </SMILES> tags. Your reply must be valid and chemically reasonable.""",
|
|
'FS': """You are an expert chemist. Given the SMILES representation of reactants and reagents, your task is to predict the potential product using your chemical reaction knowledge.
|
|
The input contains both reactants and reagents, and different reactants and reagents are separated by ".". Your reply should contain the SMILES representation of the predicted product wrapped in <SMILES> and </SMILES> tags. Your reply must be valid and chemically reasonable.""",
|
|
'RS': """You are an expert chemist. Given the SMILES representation of the product, your task is to predict the potential reactants and reagents using your chemical reaction knowledge.
|
|
The input contains the SMILES representation of the product. Your reply should contain the SMILES representation of both reactants and reagents, and all reactants and reagents should be enclosed **together** within a single pair of <SMILES> and </SMILES> tags, separated by ".". Your reply must be valid and chemically reasonable.""",
|
|
}
|
|
|
|
name_dict = {
|
|
'MG': 'molecule_generation',
|
|
'FS': 'forward_synthesis',
|
|
'RS': 'retrosynthesis'
|
|
}
|
|
|
|
fts_0shot_instruct_datasets = []
|
|
for _name in name_dict:
|
|
_hint = fts_hint_dict[_name]
|
|
fts_0shot_infer_cfg = dict(
|
|
prompt_template=dict(
|
|
type=PromptTemplate,
|
|
template=f'{_hint}\nQuestion: {{input}}\nAnswer: ',
|
|
# template=f'<s>[INST] {{input}} [/INST]',
|
|
),
|
|
retriever=dict(type=ZeroRetriever),
|
|
inferencer=dict(type=GenInferencer),
|
|
)
|
|
|
|
fts_0shot_eval_cfg = dict(
|
|
evaluator=dict(type=FTSEvaluator),
|
|
)
|
|
|
|
fts_0shot_instruct_datasets.append(
|
|
dict(
|
|
abbr=f'{_name}-0shot-instruct',
|
|
type=SmolInstructDataset,
|
|
path='osunlp/SMolInstruct',
|
|
name=name_dict[_name],
|
|
reader_cfg=fts_0shot_reader_cfg,
|
|
infer_cfg=fts_0shot_infer_cfg,
|
|
eval_cfg=fts_0shot_eval_cfg,
|
|
))
|
|
|
|
del _name
|