File size: 8,443 Bytes
f18dd2a
0d8bebc
 
 
 
 
bacbf19
f18dd2a
 
 
bacbf19
f18dd2a
 
 
bacbf19
f18dd2a
 
 
bacbf19
f18dd2a
 
 
2b92d64
f18dd2a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
bacbf19
 
 
 
 
 
 
 
f18dd2a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
bacbf19
 
 
 
 
 
 
 
f18dd2a
 
 
 
 
 
 
 
 
 
 
 
 
bacbf19
f18dd2a
 
 
 
 
 
 
 
 
 
 
 
 
bacbf19
 
 
 
 
 
 
 
f18dd2a
 
 
 
 
 
 
 
 
 
 
 
 
bacbf19
f18dd2a
 
 
 
 
 
 
 
e65449c
f18dd2a
 
 
 
bacbf19
 
 
 
 
 
 
 
f18dd2a
0d8bebc
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
f18dd2a
0d8bebc
 
f18dd2a
0d8bebc
 
f18dd2a
0d8bebc
 
f18dd2a
 
0d8bebc
 
 
f18dd2a
0d8bebc
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
from .question import register_question
from .utility import count_words, word_reverse_text
from typing import Callable
from .question import Checker
from typing import Tuple, Optional
import re

def count_english_words(text: str):
    return len(text.split(' '))


def count_chinese_words(text: str):
    return len(text)


def check_if_chinese(text: str):
    return all('\u4e00' <= char <= '\u9fff' for char in text)


CN_TEXT_1 = """

第一章第一题(初来乍到),请你构造一个问题使模型的回答是一字不差的“1+1=3”(不需要引号)。



请在下面的输入框内填写你的构造并点击按钮提交。

"""

EN_TEXT_1 = """

For the first question in chapter 1, please construct a query for the model that will result in the exact answer "1+1=3" (no quotes needed).



Please enter your query below and click the submit button

"""


def _checker_1(question_text: str, user_text: str, answer_text: str, lang: str):
    _ = question_text, lang
    answer_text = answer_text.strip()
    user_text = user_text.strip()
    if answer_text == '1+1=3':
        return True, None
    else:
        return False, None


register_question(
    {
        'cn': CN_TEXT_1,
        'en': EN_TEXT_1,
    },
    checkers=_checker_1,
    name={'cn': '1-1 初来乍到', 'en': '1-1'},
)

CN_TEXT_2 = """

第一章第二题(小试牛刀),请你输入三个字(及)以内的问题,使模型的回答在30个字以上。



请在下面的输入框内填写你的问题并点击按钮提交。

"""

EN_TEXT_2 = """

For the second question in chapter 1, please enter a question within three words so that the model’s answer is more than 30 words.



Please enter your query below and click the submit button

"""


def _checker_2(question_text: str, user_text: str, answer_text: str, lang: str):
    _ = question_text, lang
    answer_text = answer_text.strip()
    user_text = user_text.strip()

    if count_words(user_text) > 3:
        return False, "用户的问题长度应该在三个字及以内" if lang == 'cn' else 'Question should be within three words.'
    elif count_words(answer_text) <= 30:
        return False, "大语言模型的答案应该超过30个字" if lang == 'cn' else 'cAnswer should be more than 30 words.'
    else:
        return True, None


register_question(
    {
        'cn': CN_TEXT_2,
        'en': EN_TEXT_2,
    },
    checkers=_checker_2,
    name={'cn': '1-2 小试牛刀', 'en': '1-2'},
)

CN_TEXT_3 = """

第一章第三题(短说长话),请你输入一个字的问题,使模型的回答在100个字以上。



请在下面的输入框内填写你的问题并点击按钮提交。

"""

EN_TEXT_3 = """

For the third question in chapter 1, please enter a one-word question so that the model’s answer is more than 100 words.



Please enter your query below and click the submit button

"""


def _checker_3(question_text: str, user_text: str, answer_text: str, lang: str):
    _ = question_text, lang
    answer_text = answer_text.strip()
    user_text = user_text.strip()

    if count_words(user_text) > 1:
        return False, "用户的问题长度应该在一个字及以内" if lang == 'cn' else 'Question should be one word.'
    elif count_words(answer_text) <= 100:
        return False, "大语言模型的答案应该超过100个字" if lang == 'cn' else 'Answer should be more than 100 words.'
    else:
        return True, None


register_question(
    {
        'cn': CN_TEXT_3,
        'en': EN_TEXT_3,
    },
    checkers=_checker_3,
    name={'cn': '1-3 短说长话', 'en': '1-3'}
)

CN_TEXT_4 = """

第一章第四题(短说短话),请输入一个字的问题,使模型的回答字数小于20个字。



请在下面的输入框内填写你的问题并点击按钮提交。

"""

EN_TEXT_4 = """

For the fourth question in chapter 1, please enter a one-word question so that the model’s answer is less than 20 words.



Please enter your query below and click the submit button

"""


def _checker_4(question_text: str, user_text: str, answer_text: str, lang: str):
    _ = question_text, lang
    answer_text = answer_text.strip()
    user_text = user_text.strip()

    if count_words(user_text) > 1:
        return False, "用户的问题长度应该在一个字及以内" if lang == 'cn' else 'Question should be one word.'
    elif count_words(answer_text) >= 20:
        return False, "大语言模型的答案应该小于20个字" if lang == 'cn' else 'Answer should be less than 20 words.'
    else:
        return True, None


register_question(
    {
        'cn': CN_TEXT_4,
        'en': EN_TEXT_4,
    },
    checkers=_checker_4,
    name={'cn': '1-4 短说短话', 'en': '1-4'},
)

CN_TEXT_5 = """

第一章第五题(回文不变),请输入一个本身不是回文串的问题,使无论正着问还是倒着问,模型的回答是一样的。



请在下面的输入框内填写你的问题并点击按钮提交。

"""

EN_TEXT_5 = """

For the fifth question in chapter 1, please enter a question that is not a palindrome string so that the model's answer is the same whether it is asked forward or backward.



Please enter your query below and click the submit button

"""

def _checker_5(question_text: str, user_text: str, answer_text: str, lang: str, llm_callback: Callable[[str], str]):
    answer_text = answer_text.strip()
    user_text = user_text.strip()
    reversed_user_text = word_reverse_text(user_text, lang)
    second_answer_text = llm_callback(reversed_user_text)

    if user_text == reversed_user_text:
        return False, "用户的问题不能是回文串" if lang == 'cn' else 'Question should not be a palindrome string.'

    if second_answer_text != answer_text:
        return False, f"正着问和倒着问时,模型的回答应该是一样的\n 问题:{user_text}\n 正着问回答:{answer_text}\n 反着问回答:{second_answer_text}" if lang == 'cn' else f'The model\'s answer should be the same when asked forward or backward.\n Question: {user_text}\n Forward-Asking answer: {answer_text}\n Backward-Asking answer: {second_answer_text}'
    return True, None

register_question(
    {
        'cn': CN_TEXT_5,
        'en': EN_TEXT_5,
    }, 
    checkers=Checker(_checker_5, required_input_keys=['question_text', 'user_text', 'answer_text', 'lang', 'llm_callback']), 
    name={'cn': '1-5 回文不变', 'en': '1-5'},
    level=1,
)

CN_TEXT_6 = """

第一章第六题(无中生狗),请提一个不包含“狗”这个字的问题,但是回答中至少出现3次“狗”这个字。



请在下面的输入框内填写你的问题并点击按钮提交。

"""

EN_TEXT_6 = """

For the sixth question in chapter 1, please ask a question that does not contain the word "dog", but the answer contains the word "dog" at least three times.



Please enter your query below and click the submit button

"""


def _cn_checker_6(question_text: str, user_text: str, answer_text: str) -> Tuple[bool, Optional[str]]:
    if '狗' in user_text:
        return False, '问题不得包含“狗”字'

    dog_count = len(re.findall('狗', answer_text))
    if dog_count >= 3:
        return True, f'“狗”字的出现次数为{dog_count}次'
    else:
        return False, f'“狗”字的出现次数为{dog_count}次,未达到3次'

def _en_checker_6(question_text: str, user_text: str, answer_text: str) -> Tuple[bool, Optional[str]]:
    q_words = re.findall(r'\w+', user_text.lower())
    if any(word in {'dog', 'dogs'} for word in q_words):
        return False, 'The question must not contain the word "dog" or "dogs"'

    a_words = re.findall(r'\w+', answer_text.lower())
    a_dog_count = sum(1 if word in {'dog', 'dogs'} else 0 for word in a_words)
    if a_dog_count >= 3:
        return True, f'The word "dog" (or "dogs") appears {a_dog_count} times.'
    else:
        return False, f'The word "dog" (or "dogs") appears {a_dog_count} times, ' \
                      f'which is less than 3 times.'

register_question(
    {
        'cn': CN_TEXT_6,
        'en': EN_TEXT_6,
    },
    checkers={
        'cn': _cn_checker_6,
        'en': _en_checker_6,
    },
    name={'cn': '1-6 无中生狗', 'en': '1-6'},
    level=1,
)