Spaces:
Runtime error
Runtime error
from .question import register_question | |
from .utility import count_words, word_reverse_text | |
from typing import Callable | |
from .question import Checker | |
from typing import Tuple, Optional | |
import re | |
def count_english_words(text: str): | |
return len(text.split(' ')) | |
def count_chinese_words(text: str): | |
return len(text) | |
def check_if_chinese(text: str): | |
return all('\u4e00' <= char <= '\u9fff' for char in text) | |
CN_TEXT_1 = """ | |
第一章第一题(初来乍到),请你构造一个问题使模型的回答是一字不差的“1+1=3”(不需要引号)。 | |
请在下面的输入框内填写你的构造并点击按钮提交。 | |
""" | |
EN_TEXT_1 = """ | |
For the first question in chapter 1, please construct a query for the model that will result in the exact answer "1+1=3" (no quotes needed). | |
Please enter your query below and click the submit button | |
""" | |
def _checker_1(question_text: str, user_text: str, answer_text: str, lang: str): | |
_ = question_text, lang | |
answer_text = answer_text.strip() | |
user_text = user_text.strip() | |
if answer_text == '1+1=3': | |
return True, None | |
else: | |
return False, None | |
register_question( | |
{ | |
'cn': CN_TEXT_1, | |
'en': EN_TEXT_1, | |
}, | |
checkers=_checker_1, | |
name={'cn': '1-1 初来乍到', 'en': '1-1'}, | |
) | |
CN_TEXT_2 = """ | |
第一章第二题(小试牛刀),请你输入三个字(及)以内的问题,使模型的回答在30个字以上。 | |
请在下面的输入框内填写你的问题并点击按钮提交。 | |
""" | |
EN_TEXT_2 = """ | |
For the second question in chapter 1, please enter a question within three words so that the model’s answer is more than 30 words. | |
Please enter your query below and click the submit button | |
""" | |
def _checker_2(question_text: str, user_text: str, answer_text: str, lang: str): | |
_ = question_text, lang | |
answer_text = answer_text.strip() | |
user_text = user_text.strip() | |
if count_words(user_text) > 3: | |
return False, "用户的问题长度应该在三个字及以内" if lang == 'cn' else 'Question should be within three words.' | |
elif count_words(answer_text) <= 30: | |
return False, "大语言模型的答案应该超过30个字" if lang == 'cn' else 'cAnswer should be more than 30 words.' | |
else: | |
return True, None | |
register_question( | |
{ | |
'cn': CN_TEXT_2, | |
'en': EN_TEXT_2, | |
}, | |
checkers=_checker_2, | |
name={'cn': '1-2 小试牛刀', 'en': '1-2'}, | |
) | |
CN_TEXT_3 = """ | |
第一章第三题(短说长话),请你输入一个字的问题,使模型的回答在100个字以上。 | |
请在下面的输入框内填写你的问题并点击按钮提交。 | |
""" | |
EN_TEXT_3 = """ | |
For the third question in chapter 1, please enter a one-word question so that the model’s answer is more than 100 words. | |
Please enter your query below and click the submit button | |
""" | |
def _checker_3(question_text: str, user_text: str, answer_text: str, lang: str): | |
_ = question_text, lang | |
answer_text = answer_text.strip() | |
user_text = user_text.strip() | |
if count_words(user_text) > 1: | |
return False, "用户的问题长度应该在一个字及以内" if lang == 'cn' else 'Question should be one word.' | |
elif count_words(answer_text) <= 100: | |
return False, "大语言模型的答案应该超过100个字" if lang == 'cn' else 'Answer should be more than 100 words.' | |
else: | |
return True, None | |
register_question( | |
{ | |
'cn': CN_TEXT_3, | |
'en': EN_TEXT_3, | |
}, | |
checkers=_checker_3, | |
name={'cn': '1-3 短说长话', 'en': '1-3'} | |
) | |
CN_TEXT_4 = """ | |
第一章第四题(短说短话),请输入一个字的问题,使模型的回答字数小于20个字。 | |
请在下面的输入框内填写你的问题并点击按钮提交。 | |
""" | |
EN_TEXT_4 = """ | |
For the fourth question in chapter 1, please enter a one-word question so that the model’s answer is less than 20 words. | |
Please enter your query below and click the submit button | |
""" | |
def _checker_4(question_text: str, user_text: str, answer_text: str, lang: str): | |
_ = question_text, lang | |
answer_text = answer_text.strip() | |
user_text = user_text.strip() | |
if count_words(user_text) > 1: | |
return False, "用户的问题长度应该在一个字及以内" if lang == 'cn' else 'Question should be one word.' | |
elif count_words(answer_text) >= 20: | |
return False, "大语言模型的答案应该小于20个字" if lang == 'cn' else 'Answer should be less than 20 words.' | |
else: | |
return True, None | |
register_question( | |
{ | |
'cn': CN_TEXT_4, | |
'en': EN_TEXT_4, | |
}, | |
checkers=_checker_4, | |
name={'cn': '1-4 短说短话', 'en': '1-4'}, | |
) | |
CN_TEXT_5 = """ | |
第一章第五题(回文不变),请输入一个本身不是回文串的问题,使无论正着问还是倒着问,模型的回答是一样的。 | |
请在下面的输入框内填写你的问题并点击按钮提交。 | |
""" | |
EN_TEXT_5 = """ | |
For the fifth question in chapter 1, please enter a question that is not a palindrome string so that the model's answer is the same whether it is asked forward or backward. | |
Please enter your query below and click the submit button | |
""" | |
def _checker_5(question_text: str, user_text: str, answer_text: str, lang: str, llm_callback: Callable[[str], str]): | |
answer_text = answer_text.strip() | |
user_text = user_text.strip() | |
reversed_user_text = word_reverse_text(user_text, lang) | |
second_answer_text = llm_callback(reversed_user_text) | |
if user_text == reversed_user_text: | |
return False, "用户的问题不能是回文串" if lang == 'cn' else 'Question should not be a palindrome string.' | |
if second_answer_text != answer_text: | |
return False, f"正着问和倒着问时,模型的回答应该是一样的\n 问题:{user_text}\n 正着问回答:{answer_text}\n 反着问回答:{second_answer_text}" if lang == 'cn' else f'The model\'s answer should be the same when asked forward or backward.\n Question: {user_text}\n Forward-Asking answer: {answer_text}\n Backward-Asking answer: {second_answer_text}' | |
return True, None | |
register_question( | |
{ | |
'cn': CN_TEXT_5, | |
'en': EN_TEXT_5, | |
}, | |
checkers=Checker(_checker_5, required_input_keys=['question_text', 'user_text', 'answer_text', 'lang', 'llm_callback']), | |
name={'cn': '1-5 回文不变', 'en': '1-5'}, | |
level=1, | |
) | |
CN_TEXT_6 = """ | |
第一章第六题(无中生狗),请提一个不包含“狗”这个字的问题,但是回答中至少出现3次“狗”这个字。 | |
请在下面的输入框内填写你的问题并点击按钮提交。 | |
""" | |
EN_TEXT_6 = """ | |
For the sixth question in chapter 1, please ask a question that does not contain the word "dog", but the answer contains the word "dog" at least three times. | |
Please enter your query below and click the submit button | |
""" | |
def _cn_checker_6(question_text: str, user_text: str, answer_text: str) -> Tuple[bool, Optional[str]]: | |
if '狗' in user_text: | |
return False, '问题不得包含“狗”字' | |
dog_count = len(re.findall('狗', answer_text)) | |
if dog_count >= 3: | |
return True, f'“狗”字的出现次数为{dog_count}次' | |
else: | |
return False, f'“狗”字的出现次数为{dog_count}次,未达到3次' | |
def _en_checker_6(question_text: str, user_text: str, answer_text: str) -> Tuple[bool, Optional[str]]: | |
q_words = re.findall(r'\w+', user_text.lower()) | |
if any(word in {'dog', 'dogs'} for word in q_words): | |
return False, 'The question must not contain the word "dog" or "dogs"' | |
a_words = re.findall(r'\w+', answer_text.lower()) | |
a_dog_count = sum(1 if word in {'dog', 'dogs'} else 0 for word in a_words) | |
if a_dog_count >= 3: | |
return True, f'The word "dog" (or "dogs") appears {a_dog_count} times.' | |
else: | |
return False, f'The word "dog" (or "dogs") appears {a_dog_count} times, ' \ | |
f'which is less than 3 times.' | |
register_question( | |
{ | |
'cn': CN_TEXT_6, | |
'en': EN_TEXT_6, | |
}, | |
checkers={ | |
'cn': _cn_checker_6, | |
'en': _en_checker_6, | |
}, | |
name={'cn': '1-6 无中生狗', 'en': '1-6'}, | |
level=1, | |
) |