Spaces:
Runtime error
Runtime error
File size: 8,443 Bytes
f18dd2a 0d8bebc bacbf19 f18dd2a bacbf19 f18dd2a bacbf19 f18dd2a bacbf19 f18dd2a 2b92d64 f18dd2a bacbf19 f18dd2a bacbf19 f18dd2a bacbf19 f18dd2a bacbf19 f18dd2a bacbf19 f18dd2a e65449c f18dd2a bacbf19 f18dd2a 0d8bebc f18dd2a 0d8bebc f18dd2a 0d8bebc f18dd2a 0d8bebc f18dd2a 0d8bebc f18dd2a 0d8bebc |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 |
from .question import register_question
from .utility import count_words, word_reverse_text
from typing import Callable
from .question import Checker
from typing import Tuple, Optional
import re
def count_english_words(text: str) -> int:
    """Return the number of whitespace-separated words in ``text``.

    Splitting on any run of whitespace (instead of on a single literal
    space) keeps repeated spaces, tabs, newlines and leading/trailing
    whitespace from being counted as extra "words", and makes the empty
    string count as zero words rather than one.

    Args:
        text: The text to measure.

    Returns:
        The number of non-empty whitespace-delimited tokens.
    """
    # str.split() with no argument collapses whitespace runs and drops
    # empty strings, unlike str.split(' ').
    return len(text.split())
def count_chinese_words(text: str):
    """Return the length of ``text``, counting every character as one word.

    No filtering is applied: punctuation, whitespace and non-Chinese
    characters are all included in the count.
    """
    char_total = len(text)
    return char_total
def check_if_chinese(text: str):
    """Return True when every character of ``text`` lies in U+4E00..U+9FFF.

    The range bounds are inclusive. An empty string yields True because
    there is no character that falls outside the range.
    """
    for ch in text:
        # Anything below U+4E00 or above U+9FFF is outside the accepted range.
        if ch < '\u4e00' or ch > '\u9fff':
            return False
    return True
# Prompt text for question 1-1 (Chinese): the model's answer must be exactly "1+1=3".
CN_TEXT_1 = """
第一章第一题(初来乍到),请你构造一个问题使模型的回答是一字不差的“1+1=3”(不需要引号)。
请在下面的输入框内填写你的构造并点击按钮提交。
"""
# Prompt text for question 1-1 (English); same task as CN_TEXT_1.
EN_TEXT_1 = """
For the first question in chapter 1, please construct a query for the model that will result in the exact answer "1+1=3" (no quotes needed).
Please enter your query below and click the submit button
"""
def _checker_1(question_text: str, user_text: str, answer_text: str, lang: str):
_ = question_text, lang
answer_text = answer_text.strip()
user_text = user_text.strip()
if answer_text == '1+1=3':
return True, None
else:
return False, None
# Register question 1-1: per-language prompt texts, `_checker_1` as the
# checker for every language, and per-language display names.
register_question(
{
'cn': CN_TEXT_1,
'en': EN_TEXT_1,
},
checkers=_checker_1,
name={'cn': '1-1 初来乍到', 'en': '1-1'},
)
# Prompt text for question 1-2 (Chinese): a question of at most three
# characters/words must produce an answer longer than 30.
CN_TEXT_2 = """
第一章第二题(小试牛刀),请你输入三个字(及)以内的问题,使模型的回答在30个字以上。
请在下面的输入框内填写你的问题并点击按钮提交。
"""
# Prompt text for question 1-2 (English); same task as CN_TEXT_2.
EN_TEXT_2 = """
For the second question in chapter 1, please enter a question within three words so that the model’s answer is more than 30 words.
Please enter your query below and click the submit button
"""
def _checker_2(question_text: str, user_text: str, answer_text: str, lang: str):
    """Check question 1-2: a question of at most 3 words must get an answer of more than 30.

    Lengths are measured with ``count_words`` (imported from ``.utility``;
    its exact counting rules are not visible here -- confirm there).

    Args:
        question_text: Accepted but not used by this check.
        user_text: The user's question; surrounding whitespace is ignored.
        answer_text: The model's answer; surrounding whitespace is ignored.
        lang: ``'cn'`` selects the Chinese failure messages; any other
            value selects the English ones.

    Returns:
        ``(True, None)`` on success, otherwise ``(False, message)`` where
        ``message`` explains which length constraint was violated.
    """
    _ = question_text  # accepted but unused
    answer_text = answer_text.strip()
    user_text = user_text.strip()

    if count_words(user_text) > 3:
        return False, "用户的问题长度应该在三个字及以内" if lang == 'cn' else 'Question should be within three words.'
    if count_words(answer_text) <= 30:
        # The English message previously started with a stray "c" ("cAnswer ...").
        return False, "大语言模型的答案应该超过30个字" if lang == 'cn' else 'Answer should be more than 30 words.'
    return True, None
# Register question 1-2: per-language prompt texts, `_checker_2` as the
# checker for every language, and per-language display names.
register_question(
{
'cn': CN_TEXT_2,
'en': EN_TEXT_2,
},
checkers=_checker_2,
name={'cn': '1-2 小试牛刀', 'en': '1-2'},
)
# Prompt text for question 1-3 (Chinese): a one-character/word question
# must produce an answer longer than 100.
CN_TEXT_3 = """
第一章第三题(短说长话),请你输入一个字的问题,使模型的回答在100个字以上。
请在下面的输入框内填写你的问题并点击按钮提交。
"""
# Prompt text for question 1-3 (English); same task as CN_TEXT_3.
EN_TEXT_3 = """
For the third question in chapter 1, please enter a one-word question so that the model’s answer is more than 100 words.
Please enter your query below and click the submit button
"""
def _checker_3(question_text: str, user_text: str, answer_text: str, lang: str):
    """Check question 1-3: a one-word question must get an answer of more than 100 words.

    Lengths are measured with ``count_words`` (imported from ``.utility``;
    its exact counting rules are not visible here -- confirm there).

    Args:
        question_text: Accepted but not used by this check.
        user_text: The user's question; surrounding whitespace is ignored.
        answer_text: The model's answer; surrounding whitespace is ignored.
        lang: ``'cn'`` selects the Chinese failure messages; any other
            value selects the English ones.

    Returns:
        ``(True, None)`` on success, otherwise ``(False, message)``.
    """
    _ = question_text
    use_chinese = lang == 'cn'
    answer = answer_text.strip()
    question = user_text.strip()

    # The question-length constraint is checked first.
    if count_words(question) > 1:
        if use_chinese:
            return False, "用户的问题长度应该在一个字及以内"
        return False, 'Question should be one word.'

    if count_words(answer) <= 100:
        if use_chinese:
            return False, "大语言模型的答案应该超过100个字"
        return False, 'Answer should be more than 100 words.'

    return True, None
# Register question 1-3: per-language prompt texts, `_checker_3` as the
# checker for every language, and per-language display names.
register_question(
{
'cn': CN_TEXT_3,
'en': EN_TEXT_3,
},
checkers=_checker_3,
name={'cn': '1-3 短说长话', 'en': '1-3'}
)
# Prompt text for question 1-4 (Chinese): a one-character/word question
# must produce an answer shorter than 20.
CN_TEXT_4 = """
第一章第四题(短说短话),请输入一个字的问题,使模型的回答字数小于20个字。
请在下面的输入框内填写你的问题并点击按钮提交。
"""
# Prompt text for question 1-4 (English); same task as CN_TEXT_4.
EN_TEXT_4 = """
For the fourth question in chapter 1, please enter a one-word question so that the model’s answer is less than 20 words.
Please enter your query below and click the submit button
"""
def _checker_4(question_text: str, user_text: str, answer_text: str, lang: str):
    """Check question 1-4: a one-word question must get an answer of fewer than 20 words.

    Lengths are measured with ``count_words`` (imported from ``.utility``;
    its exact counting rules are not visible here -- confirm there).

    Args:
        question_text: Accepted but not used by this check.
        user_text: The user's question; surrounding whitespace is ignored.
        answer_text: The model's answer; surrounding whitespace is ignored.
        lang: ``'cn'`` selects the Chinese failure messages; any other
            value selects the English ones.

    Returns:
        ``(True, None)`` on success, otherwise ``(False, message)``.
    """
    _ = question_text
    use_chinese = lang == 'cn'
    answer = answer_text.strip()
    question = user_text.strip()

    # The question-length constraint is checked first.
    if count_words(question) > 1:
        if use_chinese:
            return False, "用户的问题长度应该在一个字及以内"
        return False, 'Question should be one word.'

    # An answer of exactly 20 words already fails: the limit is strict.
    if count_words(answer) >= 20:
        if use_chinese:
            return False, "大语言模型的答案应该小于20个字"
        return False, 'Answer should be less than 20 words.'

    return True, None
# Register question 1-4: per-language prompt texts, `_checker_4` as the
# checker for every language, and per-language display names.
register_question(
{
'cn': CN_TEXT_4,
'en': EN_TEXT_4,
},
checkers=_checker_4,
name={'cn': '1-4 短说短话', 'en': '1-4'},
)
# Prompt text for question 1-5 (Chinese): a non-palindromic question must
# get the same answer whether asked forward or reversed.
CN_TEXT_5 = """
第一章第五题(回文不变),请输入一个本身不是回文串的问题,使无论正着问还是倒着问,模型的回答是一样的。
请在下面的输入框内填写你的问题并点击按钮提交。
"""
# Prompt text for question 1-5 (English); same task as CN_TEXT_5.
EN_TEXT_5 = """
For the fifth question in chapter 1, please enter a question that is not a palindrome string so that the model's answer is the same whether it is asked forward or backward.
Please enter your query below and click the submit button
"""
def _checker_5(question_text: str, user_text: str, answer_text: str, lang: str, llm_callback: Callable[[str], str]):
    """Check question 1-5: a non-palindromic question must get the same answer when reversed.

    The question is reversed with ``word_reverse_text`` (imported from
    ``.utility``; presumably word-level or character-level depending on
    ``lang`` -- confirm there), the model is asked the reversed question
    through ``llm_callback``, and the two answers are compared.

    Args:
        question_text: Accepted but not used by this check.
        user_text: The user's question; surrounding whitespace is ignored.
        answer_text: The model's answer to ``user_text``; surrounding
            whitespace is ignored.
        lang: ``'cn'`` selects the Chinese failure messages; any other
            value selects the English ones. Also forwarded to
            ``word_reverse_text``.
        llm_callback: Callable that sends a prompt to the model and returns
            its answer.

    Returns:
        ``(True, None)`` on success, otherwise ``(False, message)``.
    """
    answer_text = answer_text.strip()
    user_text = user_text.strip()
    reversed_user_text = word_reverse_text(user_text, lang)

    # Reject palindromes before calling the model: the outcome is already
    # decided, so the extra model call would be wasted.
    if user_text == reversed_user_text:
        return False, "用户的问题不能是回文串" if lang == 'cn' else 'Question should not be a palindrome string.'

    # Strip the second answer as well, so both answers are compared on equal
    # terms and do not differ merely by surrounding whitespace.
    second_answer_text = llm_callback(reversed_user_text).strip()
    if second_answer_text != answer_text:
        if lang == 'cn':
            message = (
                "正着问和倒着问时,模型的回答应该是一样的\n"
                f" 问题:{user_text}\n"
                f" 正着问回答:{answer_text}\n"
                f" 反着问回答:{second_answer_text}"
            )
        else:
            message = (
                "The model's answer should be the same when asked forward or backward.\n"
                f" Question: {user_text}\n"
                f" Forward-Asking answer: {answer_text}\n"
                f" Backward-Asking answer: {second_answer_text}"
            )
        return False, message
    return True, None
# Register question 1-5. `_checker_5` takes an extra `llm_callback`
# argument, so it is wrapped in `Checker` with an explicit
# `required_input_keys` list naming all five inputs.
# `level=1` is passed through to `register_question`; its meaning is
# defined there and is not visible in this file.
register_question(
{
'cn': CN_TEXT_5,
'en': EN_TEXT_5,
},
checkers=Checker(_checker_5, required_input_keys=['question_text', 'user_text', 'answer_text', 'lang', 'llm_callback']),
name={'cn': '1-5 回文不变', 'en': '1-5'},
level=1,
)
# Prompt text for question 1-6 (Chinese): the question must not contain
# the character for "dog", but the answer must contain it at least 3 times.
CN_TEXT_6 = """
第一章第六题(无中生狗),请提一个不包含“狗”这个字的问题,但是回答中至少出现3次“狗”这个字。
请在下面的输入框内填写你的问题并点击按钮提交。
"""
# Prompt text for question 1-6 (English); same task with the word "dog".
EN_TEXT_6 = """
For the sixth question in chapter 1, please ask a question that does not contain the word "dog", but the answer contains the word "dog" at least three times.
Please enter your query below and click the submit button
"""
def _cn_checker_6(question_text: str, user_text: str, answer_text: str) -> Tuple[bool, Optional[str]]:
if '狗' in user_text:
return False, '问题不得包含“狗”字'
dog_count = len(re.findall('狗', answer_text))
if dog_count >= 3:
return True, f'“狗”字的出现次数为{dog_count}次'
else:
return False, f'“狗”字的出现次数为{dog_count}次,未达到3次'
def _en_checker_6(question_text: str, user_text: str, answer_text: str) -> Tuple[bool, Optional[str]]:
q_words = re.findall(r'\w+', user_text.lower())
if any(word in {'dog', 'dogs'} for word in q_words):
return False, 'The question must not contain the word "dog" or "dogs"'
a_words = re.findall(r'\w+', answer_text.lower())
a_dog_count = sum(1 if word in {'dog', 'dogs'} else 0 for word in a_words)
if a_dog_count >= 3:
return True, f'The word "dog" (or "dogs") appears {a_dog_count} times.'
else:
return False, f'The word "dog" (or "dogs") appears {a_dog_count} times, ' \
f'which is less than 3 times.'
# Register question 1-6. Unlike the earlier questions, the checker is given
# per language: `_cn_checker_6` for 'cn' and `_en_checker_6` for 'en'.
# `level=1` is passed through to `register_question`; its meaning is
# defined there and is not visible in this file.
# (A stray trailing "|" after the closing parenthesis was removed; it made
# the statement a syntax error.)
register_question(
    {
        'cn': CN_TEXT_6,
        'en': EN_TEXT_6,
    },
    checkers={
        'cn': _cn_checker_6,
        'en': _en_checker_6,
    },
    name={'cn': '1-6 无中生狗', 'en': '1-6'},
    level=1,
)