TwT-6
/

api-demo

Model card Files Files and versions Community

api-demo / opencompass-my-api /opencompass /models /claude_api /postprocessors.py

TwT-6

Upload 2667 files

256a159 verified 8 months ago

raw

history blame contribute delete

3.95 kB

	import re

	from opencompass.datasets.humaneval import humaneval_gpt_postprocess
	from opencompass.datasets.record import ReCoRD_postprocess
	from opencompass.datasets.xsum import Xsum_postprocess
	from opencompass.utils.text_postprocessors import first_option_postprocess


	def gsm8k_postprocess(text: str) -> str:
	    """Extract the digits of the last number-like token in a response.

	    The response is split on single spaces and scanned from the end. The
	    first token (from the end) that contains at least one digit is taken as
	    the answer, and every non-digit character in it is dropped. This removes
	    thousands separators, currency signs and trailing punctuation, but also
	    decimal points and minus signs (``'3.50'`` becomes ``'350'``).

	    Args:
	        text: Raw model output.

	    Returns:
	        The digit characters of the last digit-bearing token, or ``''`` when
	        no token contains a digit.
	    """
	    # Only a literal space separates tokens; newlines stay inside a token.
	    for token in reversed(text.split(' ')):
	        if any(ch.isdigit() for ch in token):
	            return ''.join(ch for ch in token if ch.isdigit())
	    return ''


	def humaneval_postprocess(text: str) -> str:
	    """Reduce a chat-style response to an indented function body.

	    Steps, in order:

	    1. The first line is always discarded (presumably the model's
	       introductory sentence) and the remainder is stripped.
	    2. If the text contains a ``` fence, the content of the first fenced
	       block is used; when the fence is never closed, everything after the
	       opening fence is used instead. A language tag on the fence line
	       (e.g. ``python``) is removed in both cases.
	    3. If the code starts with ``from``/``import``, everything up to and
	       including the first ``def`` line is dropped.
	    4. A leading ``def`` line is dropped, leaving only the body.
	    5. The result is normalised so that it starts with a 4-space indent.

	    Args:
	        text: Raw model output.

	    Returns:
	        The extracted function body, starting with four spaces.
	    """
	    indent = ' ' * 4

	    text = '\n'.join(text.split('\n')[1:]).strip()

	    if '```' in text:
	        blocks = re.findall(r'```(.*?)```', text, re.DOTALL)
	        # With no closed fence, fall back to whatever follows the opener.
	        text = blocks[0] if blocks else text.split('```')[1]
	        if not text.startswith('\n'):
	            # The fence line carried a language tag; skip past that line.
	            # find() returns -1 when there is no newline, giving text[0:].
	            text = text[text.find('\n') + 1:]

	    if text.strip().startswith(('from', 'import')):
	        # Anchor on a line that begins with ``def`` so identifiers such as
	        # ``defaultdict`` in an import line are not mistaken for it.
	        def_match = re.search(r'^[ \t]*def\b', text, re.MULTILINE)
	        if def_match is not None:
	            text = text[text.find('\n', def_match.end()) + 1:]

	    if text.strip().startswith('def'):
	        text = '\n'.join(text.split('\n')[1:])

	    if not text.startswith(indent):
	        if text.startswith(' '):
	            # Under-indented first line: re-indent it to four spaces.
	            text = indent + text.lstrip()
	        else:
	            # No indentation at all: indent every line.
	            text = '\n'.join(indent + line for line in text.split('\n'))
	    return text


	def lcsts_postprocess(text: str) -> str:
	    """Strip list markers and surrounding punctuation from a summary.

	    After trimming whitespace, a leading ``'1. '`` and then a leading
	    ``'- '`` are removed if present. Only the prefix is removed; later
	    occurrences of the same characters inside the text are kept. Finally
	    the characters ``“ ， 。 ！ ”`` are stripped from both ends.

	    Args:
	        text: Raw model output.

	    Returns:
	        The cleaned summary text.
	    """
	    text = text.strip()
	    for marker in ('1. ', '- '):
	        if text.startswith(marker):
	            # Slice instead of str.replace so inner occurrences survive.
	            text = text[len(marker):]
	    return text.strip('“，。！”')


	def mbpp_postprocess(text: str) -> str:
	    """Extract the code from a response that may wrap it in a ``` fence.

	    If the response starts with ``'Here'``, its first line is dropped and
	    the rest stripped. If a ``` fence is present, the content of the first
	    fenced block is returned; when the fence is never closed, everything
	    after the opening fence is returned instead. A language tag on the
	    fence line (e.g. ``python``) is removed in both cases. Text without a
	    fence is returned as is.

	    Args:
	        text: Raw model output.

	    Returns:
	        The extracted code.
	    """
	    if text.startswith('Here'):
	        text = '\n'.join(text.split('\n')[1:]).strip()

	    if '```' not in text:
	        return text

	    blocks = re.findall(r'```(.*?)```', text, re.DOTALL)
	    # With no closed fence, fall back to whatever follows the opener.
	    text = blocks[0] if blocks else text.split('```')[1]
	    if not text.startswith('\n'):
	        # The fence line carried a language tag; skip past that line.
	        # find() returns -1 when there is no newline, giving text[0:].
	        text = text[text.find('\n') + 1:]
	    return text


	def strategyqa_pred_postprocess(text: str) -> str:
	    """Extract a ``'yes'``/``'no'`` verdict from a response.

	    If the response starts with ``'Here'``, its first line is dropped.
	    Only the text after the last ``'answer is '`` is searched (the whole
	    text when that phrase is absent), case-insensitively, and the first
	    occurrence of ``yes`` or ``no`` wins. Matching is by substring, so
	    ``no`` is also found inside words such as ``not``.

	    Args:
	        text: Raw model output.

	    Returns:
	        ``'yes'`` or ``'no'`` in lower case, or ``''`` when neither occurs.
	    """
	    if text.startswith('Here'):
	        text = '\n'.join(text.split('\n')[1:]).strip()
	    tail = text.split('answer is ')[-1]
	    # The pipe must be unescaped to act as alternation between the words.
	    match = re.search(r'(yes|no)', tail.lower())
	    return match.group(1) if match else ''


	def flores_postprocess(text: str) -> str:
	    """Return the last line of the response with whitespace trimmed.

	    Args:
	        text: Raw model output.

	    Returns:
	        The final ``'\\n'``-separated line of the stripped text, itself
	        stripped; ``''`` for empty or whitespace-only input.
	    """
	    stripped = text.strip()
	    # Only the segment after the final newline is needed.
	    return stripped.rsplit('\n', 1)[-1].strip()


	def flores_postprocess_chinese(text: str) -> str:
	    """Return the last line of the response, segmented with jieba.

	    The last line of the stripped text is taken, runs of whitespace are
	    collapsed to single spaces, and the result is passed through
	    ``jieba.cut``; the pieces it yields are joined with single spaces.

	    Args:
	        text: Raw model output.

	    Returns:
	        The space-joined segments of the final line.
	    """
	    # Imported lazily so jieba is only required when this function runs.
	    import jieba

	    last_line = text.strip().split('\n')[-1].strip()
	    collapsed = re.sub(r'\s+', ' ', last_line).strip()
	    return ' '.join(jieba.cut(collapsed))


	def record_postprocess(text: str) -> str:
	    """Extract the entity that follows ``'refers to '`` in a response.

	    When the phrase ``'refers to '`` occurs, everything after its first
	    occurrence up to (not including) the next ``'.'`` is returned with
	    surrounding whitespace removed. Otherwise the text is handed to
	    ``ReCoRD_postprocess``.

	    Args:
	        text: Raw model output.

	    Returns:
	        The extracted entity, or the result of ``ReCoRD_postprocess``.
	    """
	    match = re.search(r'(?<=refers to )[^.]+', text)
	    if match is None:
	        return ReCoRD_postprocess(text)
	    return match.group().strip()


	def humaneval_claude2_postprocess(text: str) -> str:
	    """Drop a leading ``'Here ...'`` paragraph, then apply the GPT cleaner.

	    If the response starts with ``'Here'`` and contains a blank line, the
	    text up to and including the first blank line is removed. A response
	    that starts with ``'Here'`` but has no blank line is passed on
	    unchanged, so that its content is not thrown away. The result is
	    handed to ``humaneval_gpt_postprocess``.

	    Args:
	        text: Raw model output.

	    Returns:
	        Whatever ``humaneval_gpt_postprocess`` returns for the trimmed text.
	    """
	    if text.startswith('Here'):
	        _, separator, remainder = text.partition('\n\n')
	        # An empty separator means there is no paragraph break to cut at.
	        if separator:
	            text = remainder
	    return humaneval_gpt_postprocess(text)


	def xsum_postprocess(text: str) -> str:
	    """Drop a leading ``'Here ...'`` paragraph, then apply the Xsum cleaner.

	    If the response starts with ``'Here'`` and contains a blank line, the
	    text up to and including the first blank line is removed. A response
	    that starts with ``'Here'`` but has no blank line is passed on
	    unchanged, so that its content is not thrown away. The result is
	    handed to ``Xsum_postprocess``.

	    Args:
	        text: Raw model output.

	    Returns:
	        Whatever ``Xsum_postprocess`` returns for the trimmed text.
	    """
	    if text.startswith('Here'):
	        _, separator, remainder = text.partition('\n\n')
	        # An empty separator means there is no paragraph break to cut at.
	        if separator:
	            text = remainder
	    return Xsum_postprocess(text)


	def yes_no_postprocess(text: str) -> str:
	    """Map a yes/no style response onto option ``'A'`` or ``'B'``.

	    The check is a case-insensitive substring test, with ``yes`` taking
	    priority over ``no``. Because it is a substring test, ``no`` is also
	    found inside words such as ``not``. When neither occurs, the text is
	    handed to ``first_option_postprocess`` with the options ``'AB'``.

	    Args:
	        text: Raw model output.

	    Returns:
	        ``'A'`` if the text contains ``yes``, ``'B'`` if it contains ``no``,
	        otherwise the result of ``first_option_postprocess(text, 'AB')``.
	    """
	    lowered = text.lower()
	    if 'yes' in lowered:
	        return 'A'
	    if 'no' in lowered:
	        return 'B'
	    return first_option_postprocess(text, 'AB')