File size: 693 Bytes
256a159 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 |
import re
from datasets import load_dataset
from opencompass.registry import LOAD_DATASET
from .base import BaseDataset
@LOAD_DATASET.register_module()
class CValuesDataset(BaseDataset):
    """Dataset loader that reads JSON data and relabels its two replies.

    The numeric reply markers found in each example are rewritten to
    letter markers so that the prompt text and the label agree on an
    A/B naming scheme.
    """

    @staticmethod
    def load(path):
        """Load the JSON data at ``path`` and normalize reply markers.

        For every example, the ``prompt`` field has '回复1' / '回复2'
        rewritten to '回复A' / '回复B', and the ``label`` field has
        '回复1' / '回复2' rewritten to 'A' / 'B'.

        Args:
            path: Forwarded unchanged to ``load_dataset`` as
                ``data_files``.

        Returns:
            The result of mapping the preprocessing step over the object
            returned by ``load_dataset('json', data_files=path)``.
        """
        dataset = load_dataset('json', data_files=path)

        def preprocess(example):
            """Rewrite the reply markers of a single example in place."""
            # The markers are literal substrings with no regex
            # metacharacters, so plain str.replace is sufficient.
            # NOTE(review): assumes 'prompt' and 'label' are str values;
            # confirm against the data files.
            example['prompt'] = (
                example['prompt']
                .replace('回复1', '回复A')
                .replace('回复2', '回复B')
            )
            example['label'] = (
                example['label']
                .replace('回复1', 'A')
                .replace('回复2', 'B')
            )
            return example

        return dataset.map(preprocess)
|